/te2/text_model/embeddings/token_embedding/Gather:Gather*input:te2_2E_text_5F_model_2E_embeddings_2E_token_5F_embedding_2E_weight.bin(float32:49408,1280);input_5F_ids(1,77)*output:_2F_te2_2F_text_5F_model_2F_embeddings_2F_token_5F_embedding_2F_Gather_5F_output_5F_0(1,77,1280) /te2/text_model/embeddings/Add:Add*input:_2F_te2_2F_text_5F_model_2F_embeddings_2F_token_5F_embedding_2F_Gather_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_embeddings_2F_position_5F_embedding_2F_Gather_5F_output_5F_0.bin(float32:1,77,1280)*output:out_5F_2(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm1/ReduceMean:ReduceMean*input:out_5F_2(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.0/layer_norm1/Sub:Sub*input:out_5F_2(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.0/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.0/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.0/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);2971.bin(float32:1280,3840)*output:2972(1,77,3840) :Split*input:2972(1,77,3840);2976.bin(int64:3)*output:2973(1,77,1280);2974(1,77,1280);2975(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.0/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);2973(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);2974(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.0/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);2975(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.0/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.0/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.0/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.0/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.0/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.0/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.0/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.0/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.0/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5662.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/Add:Add*input:out_5F_2(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.0/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.0/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.0/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.0/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5663.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.0/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5664.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.0/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_3(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm1/ReduceMean:ReduceMean*input:out_5F_3(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.1/layer_norm1/Sub:Sub*input:out_5F_3(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.1/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.1/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.1/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);2978.bin(float32:1280,3840)*output:2979(1,77,3840) :Split*input:2979(1,77,3840);2976.bin(int64:3)*output:2980(1,77,1280);2981(1,77,1280);2982(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.1/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);2980(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);2981(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.1/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);2982(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.1/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.1/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.1/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.1/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.1/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.1/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.1/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.1/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.1/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5713.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/Add:Add*input:out_5F_3(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.1/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.1/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.1/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.1/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5714.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.1/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5715.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_1_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_4(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm1/ReduceMean:ReduceMean*input:out_5F_4(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.2/layer_norm1/Sub:Sub*input:out_5F_4(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.2/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.2/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.2/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);2985.bin(float32:1280,3840)*output:2986(1,77,3840) :Split*input:2986(1,77,3840);2976.bin(int64:3)*output:2987(1,77,1280);2988(1,77,1280);2989(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.2/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);2987(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);2988(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.2/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);2989(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.2/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.2/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.2/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.2/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.2/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.2/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.2/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.2/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.2/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5764.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/Add:Add*input:out_5F_4(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.2/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.2/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.2/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.2/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5765.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.2/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5766.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_2_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_5(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm1/ReduceMean:ReduceMean*input:out_5F_5(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.3/layer_norm1/Sub:Sub*input:out_5F_5(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.3/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.3/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.3/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);2992.bin(float32:1280,3840)*output:2993(1,77,3840) :Split*input:2993(1,77,3840);2976.bin(int64:3)*output:2994(1,77,1280);2995(1,77,1280);2996(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.3/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);2994(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);2995(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.3/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);2996(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.3/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.3/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.3/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.3/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.3/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.3/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.3/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.3/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.3/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5815.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/Add:Add*input:out_5F_5(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.3/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.3/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.3/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.3/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5816.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.3/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5817.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.3/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_3_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_6(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm1/ReduceMean:ReduceMean*input:out_5F_6(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.4/layer_norm1/Sub:Sub*input:out_5F_6(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.4/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.4/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.4/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);2999.bin(float32:1280,3840)*output:3000(1,77,3840) :Split*input:3000(1,77,3840);2976.bin(int64:3)*output:3001(1,77,1280);3002(1,77,1280);3003(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.4/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3001(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3002(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.4/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3003(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.4/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.4/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.4/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.4/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.4/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.4/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.4/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.4/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.4/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5866.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/Add:Add*input:out_5F_6(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.4/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.4/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.4/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.4/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5867.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.4/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5868.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.4/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_4_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_7(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm1/ReduceMean:ReduceMean*input:out_5F_7(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.5/layer_norm1/Sub:Sub*input:out_5F_7(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.5/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.5/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.5/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3006.bin(float32:1280,3840)*output:3007(1,77,3840) :Split*input:3007(1,77,3840);2976.bin(int64:3)*output:3008(1,77,1280);3009(1,77,1280);3010(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.5/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3008(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3009(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.5/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3010(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.5/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.5/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.5/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.5/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.5/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.5/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.5/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.5/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.5/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5917.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/Add:Add*input:out_5F_7(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.5/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.5/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.5/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.5/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5918.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.5/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5919.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.5/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_5_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_8(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm1/ReduceMean:ReduceMean*input:out_5F_8(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.6/layer_norm1/Sub:Sub*input:out_5F_8(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.6/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.6/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.6/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3013.bin(float32:1280,3840)*output:3014(1,77,3840) :Split*input:3014(1,77,3840);2976.bin(int64:3)*output:3015(1,77,1280);3016(1,77,1280);3017(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.6/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3015(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3016(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.6/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3017(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.6/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.6/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.6/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.6/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.6/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.6/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.6/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.6/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.6/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5968.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/Add:Add*input:out_5F_8(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.6/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.6/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.6/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.6/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_5969.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.6/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_5970.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.6/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_6_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_9(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm1/ReduceMean:ReduceMean*input:out_5F_9(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.7/layer_norm1/Sub:Sub*input:out_5F_9(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.7/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.7/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.7/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3020.bin(float32:1280,3840)*output:3021(1,77,3840) :Split*input:3021(1,77,3840);2976.bin(int64:3)*output:3022(1,77,1280);3023(1,77,1280);3024(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.7/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3022(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3023(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.7/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3024(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.7/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.7/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.7/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.7/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.7/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.7/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.7/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.7/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.7/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6019.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/Add:Add*input:out_5F_9(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.7/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.7/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.7/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.7/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6020.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.7/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6021.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.7/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_7_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_10(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm1/ReduceMean:ReduceMean*input:out_5F_10(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.8/layer_norm1/Sub:Sub*input:out_5F_10(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.8/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.8/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.8/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3027.bin(float32:1280,3840)*output:3028(1,77,3840) :Split*input:3028(1,77,3840);2976.bin(int64:3)*output:3029(1,77,1280);3030(1,77,1280);3031(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.8/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3029(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3030(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.8/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3031(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.8/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.8/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.8/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.8/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.8/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.8/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.8/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.8/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.8/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6070.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/Add:Add*input:out_5F_10(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.8/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.8/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.8/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.8/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6071.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.8/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6072.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.8/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_8_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_11(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm1/ReduceMean:ReduceMean*input:out_5F_11(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.9/layer_norm1/Sub:Sub*input:out_5F_11(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.9/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.9/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.9/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3034.bin(float32:1280,3840)*output:3035(1,77,3840) :Split*input:3035(1,77,3840);2976.bin(int64:3)*output:3036(1,77,1280);3037(1,77,1280);3038(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.9/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3036(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3037(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.9/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3038(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.9/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.9/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.9/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.9/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.9/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.9/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.9/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.9/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.9/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6121.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/Add:Add*input:out_5F_11(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.9/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.9/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.9/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.9/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6122.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.9/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6123.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.9/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_9_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_12(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm1/ReduceMean:ReduceMean*input:out_5F_12(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.10/layer_norm1/Sub:Sub*input:out_5F_12(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.10/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.10/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.10/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3041.bin(float32:1280,3840)*output:3042(1,77,3840) :Split*input:3042(1,77,3840);2976.bin(int64:3)*output:3043(1,77,1280);3044(1,77,1280);3045(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.10/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3043(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3044(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.10/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3045(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.10/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.10/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.10/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.10/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.10/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.10/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.10/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.10/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.10/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6172.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/Add:Add*input:out_5F_12(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.10/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.10/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.10/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.10/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6173.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.10/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6174.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.10/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_10_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_13(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm1/ReduceMean:ReduceMean*input:out_5F_13(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.11/layer_norm1/Sub:Sub*input:out_5F_13(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.11/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.11/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.11/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3048.bin(float32:1280,3840)*output:3049(1,77,3840) :Split*input:3049(1,77,3840);2976.bin(int64:3)*output:3050(1,77,1280);3051(1,77,1280);3052(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.11/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3050(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3051(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.11/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3052(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.11/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.11/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.11/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.11/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.11/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.11/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.11/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.11/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.11/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6223.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/Add:Add*input:out_5F_13(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.11/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.11/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.11/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.11/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6224.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.11/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6225.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.11/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_11_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_14(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm1/ReduceMean:ReduceMean*input:out_5F_14(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.12/layer_norm1/Sub:Sub*input:out_5F_14(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.12/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.12/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.12/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3055.bin(float32:1280,3840)*output:3056(1,77,3840) :Split*input:3056(1,77,3840);2976.bin(int64:3)*output:3057(1,77,1280);3058(1,77,1280);3059(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.12/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3057(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3058(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.12/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3059(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.12/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.12/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.12/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.12/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.12/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.12/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.12/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.12/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.12/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6274.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/Add:Add*input:out_5F_14(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.12/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.12/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.12/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.12/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6275.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.12/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6276.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_12_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.12/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_12_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_15(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm1/ReduceMean:ReduceMean*input:out_5F_15(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.13/layer_norm1/Sub:Sub*input:out_5F_15(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.13/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.13/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.13/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3062.bin(float32:1280,3840)*output:3063(1,77,3840) :Split*input:3063(1,77,3840);2976.bin(int64:3)*output:3064(1,77,1280);3065(1,77,1280);3066(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.13/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3064(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3065(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.13/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3066(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.13/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.13/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.13/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.13/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.13/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.13/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.13/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.13/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.13/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6325.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/Add:Add*input:out_5F_15(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.13/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.13/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.13/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.13/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6326.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.13/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6327.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_13_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.13/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_13_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_16(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm1/ReduceMean:ReduceMean*input:out_5F_16(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.14/layer_norm1/Sub:Sub*input:out_5F_16(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.14/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.14/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.14/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3069.bin(float32:1280,3840)*output:3070(1,77,3840) :Split*input:3070(1,77,3840);2976.bin(int64:3)*output:3071(1,77,1280);3072(1,77,1280);3073(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.14/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3071(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3072(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.14/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3073(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.14/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.14/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.14/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.14/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.14/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.14/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.14/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.14/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.14/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6376.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/Add:Add*input:out_5F_16(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.14/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.14/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.14/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.14/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6377.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.14/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6378.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_14_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.14/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_14_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_17(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm1/ReduceMean:ReduceMean*input:out_5F_17(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.15/layer_norm1/Sub:Sub*input:out_5F_17(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.15/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.15/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.15/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3076.bin(float32:1280,3840)*output:3077(1,77,3840) :Split*input:3077(1,77,3840);2976.bin(int64:3)*output:3078(1,77,1280);3079(1,77,1280);3080(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.15/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3078(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3079(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.15/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3080(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.15/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.15/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.15/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.15/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.15/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.15/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.15/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.15/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.15/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6427.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/Add:Add*input:out_5F_17(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.15/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.15/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.15/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.15/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6428.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.15/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6429.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_15_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.15/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_15_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_18(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm1/ReduceMean:ReduceMean*input:out_5F_18(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.16/layer_norm1/Sub:Sub*input:out_5F_18(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.16/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.16/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.16/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3083.bin(float32:1280,3840)*output:3084(1,77,3840) :Split*input:3084(1,77,3840);2976.bin(int64:3)*output:3085(1,77,1280);3086(1,77,1280);3087(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.16/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3085(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3086(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.16/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3087(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.16/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.16/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.16/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.16/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.16/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.16/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.16/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.16/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.16/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6478.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/Add:Add*input:out_5F_18(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.16/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.16/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.16/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.16/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6479.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.16/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6480.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_16_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.16/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_16_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_19(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm1/ReduceMean:ReduceMean*input:out_5F_19(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.17/layer_norm1/Sub:Sub*input:out_5F_19(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.17/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.17/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.17/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3090.bin(float32:1280,3840)*output:3091(1,77,3840) :Split*input:3091(1,77,3840);2976.bin(int64:3)*output:3092(1,77,1280);3093(1,77,1280);3094(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.17/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3092(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3093(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.17/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3094(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.17/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.17/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.17/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.17/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.17/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.17/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.17/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.17/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.17/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6529.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/Add:Add*input:out_5F_19(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.17/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.17/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.17/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.17/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6530.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.17/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6531.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_17_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.17/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_17_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_20(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm1/ReduceMean:ReduceMean*input:out_5F_20(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.18/layer_norm1/Sub:Sub*input:out_5F_20(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.18/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.18/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.18/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3097.bin(float32:1280,3840)*output:3098(1,77,3840) :Split*input:3098(1,77,3840);2976.bin(int64:3)*output:3099(1,77,1280);3100(1,77,1280);3101(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.18/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3099(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3100(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.18/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3101(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.18/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.18/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.18/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.18/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.18/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.18/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.18/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.18/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.18/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6580.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/Add:Add*input:out_5F_20(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.18/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.18/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.18/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.18/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6581.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.18/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6582.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_18_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.18/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_18_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_21(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm1/ReduceMean:ReduceMean*input:out_5F_21(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.19/layer_norm1/Sub:Sub*input:out_5F_21(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.19/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.19/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.19/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3104.bin(float32:1280,3840)*output:3105(1,77,3840) :Split*input:3105(1,77,3840);2976.bin(int64:3)*output:3106(1,77,1280);3107(1,77,1280);3108(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.19/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3106(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3107(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.19/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3108(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.19/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.19/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.19/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.19/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.19/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.19/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.19/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.19/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.19/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6631.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/Add:Add*input:out_5F_21(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.19/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.19/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.19/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.19/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6632.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.19/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6633.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_19_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.19/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_19_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_22(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm1/ReduceMean:ReduceMean*input:out_5F_22(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.20/layer_norm1/Sub:Sub*input:out_5F_22(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.20/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.20/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.20/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3111.bin(float32:1280,3840)*output:3112(1,77,3840) :Split*input:3112(1,77,3840);2976.bin(int64:3)*output:3113(1,77,1280);3114(1,77,1280);3115(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.20/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3113(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3114(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.20/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3115(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.20/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.20/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.20/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.20/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.20/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.20/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.20/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.20/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.20/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6682.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/Add:Add*input:out_5F_22(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.20/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.20/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.20/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.20/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6683.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.20/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6684.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_20_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.20/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_20_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_23(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm1/ReduceMean:ReduceMean*input:out_5F_23(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.21/layer_norm1/Sub:Sub*input:out_5F_23(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.21/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.21/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.21/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3118.bin(float32:1280,3840)*output:3119(1,77,3840) :Split*input:3119(1,77,3840);2976.bin(int64:3)*output:3120(1,77,1280);3121(1,77,1280);3122(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.21/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3120(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3121(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.21/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3122(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.21/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.21/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.21/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.21/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.21/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.21/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.21/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.21/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.21/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6733.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/Add:Add*input:out_5F_23(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.21/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.21/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.21/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.21/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6734.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.21/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6735.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_21_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.21/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_21_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_24(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm1/ReduceMean:ReduceMean*input:out_5F_24(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.22/layer_norm1/Sub:Sub*input:out_5F_24(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.22/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.22/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.22/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3125.bin(float32:1280,3840)*output:3126(1,77,3840) :Split*input:3126(1,77,3840);2976.bin(int64:3)*output:3127(1,77,1280);3128(1,77,1280);3129(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.22/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3127(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3128(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.22/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3129(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.22/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.22/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.22/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.22/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.22/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.22/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.22/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.22/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.22/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6784.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/Add:Add*input:out_5F_24(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.22/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.22/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.22/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.22/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6785.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.22/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6786.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_22_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.22/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_22_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_25(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm1/ReduceMean:ReduceMean*input:out_5F_25(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.23/layer_norm1/Sub:Sub*input:out_5F_25(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.23/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.23/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.23/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3132.bin(float32:1280,3840)*output:3133(1,77,3840) :Split*input:3133(1,77,3840);2976.bin(int64:3)*output:3134(1,77,1280);3135(1,77,1280);3136(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.23/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3134(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3135(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.23/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3136(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.23/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.23/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.23/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.23/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.23/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.23/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.23/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.23/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.23/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6835.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/Add:Add*input:out_5F_25(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.23/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.23/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.23/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.23/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6836.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.23/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6837.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_23_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.23/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_23_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_26(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm1/ReduceMean:ReduceMean*input:out_5F_26(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.24/layer_norm1/Sub:Sub*input:out_5F_26(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.24/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.24/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.24/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3139.bin(float32:1280,3840)*output:3140(1,77,3840) :Split*input:3140(1,77,3840);2976.bin(int64:3)*output:3141(1,77,1280);3142(1,77,1280);3143(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.24/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3141(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3142(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.24/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3143(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.24/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.24/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.24/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.24/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.24/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.24/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.24/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.24/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.24/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6886.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/Add:Add*input:out_5F_26(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.24/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.24/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.24/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.24/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6887.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.24/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6888.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_24_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.24/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_24_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_27(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm1/ReduceMean:ReduceMean*input:out_5F_27(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.25/layer_norm1/Sub:Sub*input:out_5F_27(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.25/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.25/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.25/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3146.bin(float32:1280,3840)*output:3147(1,77,3840) :Split*input:3147(1,77,3840);2976.bin(int64:3)*output:3148(1,77,1280);3149(1,77,1280);3150(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.25/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3148(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3149(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.25/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3150(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.25/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.25/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.25/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.25/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.25/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.25/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.25/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.25/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.25/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6937.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/Add:Add*input:out_5F_27(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.25/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.25/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.25/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.25/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6938.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.25/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6939.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_25_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.25/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_25_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_28(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm1/ReduceMean:ReduceMean*input:out_5F_28(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.26/layer_norm1/Sub:Sub*input:out_5F_28(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.26/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.26/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.26/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3153.bin(float32:1280,3840)*output:3154(1,77,3840) :Split*input:3154(1,77,3840);2976.bin(int64:3)*output:3155(1,77,1280);3156(1,77,1280);3157(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.26/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3155(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3156(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.26/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3157(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.26/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.26/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.26/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.26/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.26/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.26/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.26/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.26/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.26/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6988.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/Add:Add*input:out_5F_28(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.26/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.26/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.26/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.26/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_6989.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.26/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_6990.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_26_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.26/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_26_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_29(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm1/ReduceMean:ReduceMean*input:out_5F_29(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.27/layer_norm1/Sub:Sub*input:out_5F_29(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.27/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.27/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.27/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3160.bin(float32:1280,3840)*output:3161(1,77,3840) :Split*input:3161(1,77,3840);2976.bin(int64:3)*output:3162(1,77,1280);3163(1,77,1280);3164(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.27/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3162(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3163(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.27/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3164(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.27/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.27/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.27/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.27/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.27/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.27/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.27/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.27/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.27/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7039.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/Add:Add*input:out_5F_29(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.27/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.27/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.27/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.27/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7040.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.27/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_7041.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_27_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.27/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_27_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_30(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm1/ReduceMean:ReduceMean*input:out_5F_30(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.28/layer_norm1/Sub:Sub*input:out_5F_30(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.28/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.28/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.28/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3167.bin(float32:1280,3840)*output:3168(1,77,3840) :Split*input:3168(1,77,3840);2976.bin(int64:3)*output:3169(1,77,1280);3170(1,77,1280);3171(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.28/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3169(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3170(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.28/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3171(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.28/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.28/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.28/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.28/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.28/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.28/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.28/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.28/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.28/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7090.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/Add:Add*input:out_5F_30(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.28/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.28/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.28/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.28/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7091.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.28/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_7092.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_28_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.28/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_28_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_31(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm1/ReduceMean:ReduceMean*input:out_5F_31(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.29/layer_norm1/Sub:Sub*input:out_5F_31(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.29/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.29/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.29/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3174.bin(float32:1280,3840)*output:3175(1,77,3840) :Split*input:3175(1,77,3840);2976.bin(int64:3)*output:3176(1,77,1280);3177(1,77,1280);3178(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.29/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3176(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3177(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.29/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3178(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.29/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.29/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.29/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.29/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.29/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.29/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.29/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.29/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.29/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7141.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/Add:Add*input:out_5F_31(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.29/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.29/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.29/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.29/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7142.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.29/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_7143.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_29_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.29/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_29_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_32(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm1/ReduceMean:ReduceMean*input:out_5F_32(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.30/layer_norm1/Sub:Sub*input:out_5F_32(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.30/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.30/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.30/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3181.bin(float32:1280,3840)*output:3182(1,77,3840) :Split*input:3182(1,77,3840);2976.bin(int64:3)*output:3183(1,77,1280);3184(1,77,1280);3185(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.30/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3183(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3184(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.30/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3185(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.30/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.30/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.30/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.30/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.30/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.30/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.30/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.30/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.30/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7192.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/Add:Add*input:out_5F_32(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.30/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.30/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.30/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.30/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7193.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.30/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_7194.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_30_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.30/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_30_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_33(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm1/ReduceMean:ReduceMean*input:out_5F_33(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.31/layer_norm1/Sub:Sub*input:out_5F_33(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm1/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm1/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.31/layer_norm1/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.31/layer_norm1/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.31/layer_norm1/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm1/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_layer_5F_norm1_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm1/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_layer_5F_norm1_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280) :MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm1_2F_Add_5F_1_5F_output_5F_0(1,77,1280);3188.bin(float32:1280,3840)*output:3189(1,77,3840) :Split*input:3189(1,77,3840);2976.bin(int64:3)*output:3190(1,77,1280);3191(1,77,1280);3192(1,77,1280)*axis:-1 /te2/text_model/encoder/layers.31/self_attn/q_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:1280);3190(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/self_attn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_q_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/self_attn/k_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:1280);3191(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/self_attn/Reshape:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_k_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Transpose:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.31/self_attn/v_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:1280);3192(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/self_attn/Reshape_1:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_v_5F_proj_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_1_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Transpose_1:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.31/self_attn/Reshape_2:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Transpose_2:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,77,20,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.31/self_attn/Reshape_3:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Reshape_4:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Reshape_5:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Transpose_3:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*perm:0,2,1 /te2/text_model/encoder/layers.31/self_attn/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_3_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(20,64,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77) /te2/text_model/encoder/layers.31/self_attn/Reshape_6:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_7_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_Expand_5F_output_5F_0.bin(float32:1,1,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77) /te2/text_model/encoder/layers.31/self_attn/Reshape_7:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_output_5F_0(1,20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_8_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Softmax:Softmax*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(20,77,77)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77)*axis:-1 /te2/text_model/encoder/layers.31/self_attn/MatMul_1:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Softmax_5F_output_5F_0(20,77,77);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_5_5F_output_5F_0(20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64) /te2/text_model/encoder/layers.31/self_attn/Reshape_8:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0(20,77,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_9_5F_output_5F_0.bin(int64:4)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/Transpose_4:Transpose*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_8_5F_output_5F_0(1,20,77,64)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64)*perm:0,2,1,3 /te2/text_model/encoder/layers.31/self_attn/Reshape_9:Reshape*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0(1,77,20,64);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_10_5F_output_5F_0.bin(int64:3)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280)*allowzero:0 /te2/text_model/encoder/layers.31/self_attn/out_proj/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_9_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7243.bin(float32:1280,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/self_attn/out_proj/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_out_5F_proj_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/Add:Add*input:out_5F_33(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_self_5F_attn_2F_out_5F_proj_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm2/ReduceMean:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.31/layer_norm2/Sub:Sub*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm2/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm2/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/encoder/layers.31/layer_norm2/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.31/layer_norm2/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/encoder/layers.31/layer_norm2/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm2/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_layer_5F_norm2_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/layer_norm2/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_layer_5F_norm2_2E_bias.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/mlp/fc1/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_layer_5F_norm2_2F_Add_5F_1_5F_output_5F_0(1,77,1280);onnx_3A__3A_MatMul_5F_7244.bin(float32:1280,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/fc1/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_mlp_2E_fc1_2E_bias.bin(float32:5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc1_2F_MatMul_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/activation_fn/Div:Div*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/activation_fn/Erf:Erf*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Div_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/activation_fn/Add:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Erf_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/activation_fn/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc1_2F_Add_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Add_5F_output_5F_0(1,77,5120)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/activation_fn/Mul_1:Mul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_output_5F_0(1,77,5120);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_mlp_2F_activation_5F_fn_2F_Constant_5F_2_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120) /te2/text_model/encoder/layers.31/mlp/fc2/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_activation_5F_fn_2F_Mul_5F_1_5F_output_5F_0(1,77,5120);onnx_3A__3A_MatMul_5F_7245.bin(float32:5120,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/mlp/fc2/Add:Add*input:te2_2E_text_5F_model_2E_encoder_2E_layers_2E_31_2E_mlp_2E_fc2_2E_bias.bin(float32:1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc2_2F_MatMul_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280) /te2/text_model/encoder/layers.31/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_31_2F_mlp_2F_fc2_2F_Add_5F_output_5F_0(1,77,1280)*output:out_5F_34(1,77,1280) /te2/text_model/final_layer_norm/ReduceMean:ReduceMean*input:out_5F_34(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_ReduceMean_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/final_layer_norm/Sub:Sub*input:out_5F_34(1,77,1280);_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_ReduceMean_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Sub_5F_output_5F_0(1,77,1280) /te2/text_model/final_layer_norm/Pow:Pow*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Pow_5F_output_5F_0(1,77,1280) /te2/text_model/final_layer_norm/ReduceMean_1:ReduceMean*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Pow_5F_output_5F_0(1,77,1280)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1)*axes:-1 /te2/text_model/final_layer_norm/Add:Add*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_ReduceMean_5F_1_5F_output_5F_0(1,77,1);_2F_te2_2F_text_5F_model_2F_encoder_2F_layers_2E_0_2F_layer_5F_norm1_2F_Constant_5F_1_5F_output_5F_0.bin(float32:)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Add_5F_output_5F_0(1,77,1) /te2/text_model/final_layer_norm/Sqrt:Sqrt*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Add_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Sqrt_5F_output_5F_0(1,77,1) /te2/text_model/final_layer_norm/Div:Div*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Sub_5F_output_5F_0(1,77,1280);_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Sqrt_5F_output_5F_0(1,77,1)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Div_5F_output_5F_0(1,77,1280) /te2/text_model/final_layer_norm/Mul:Mul*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Div_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_final_5F_layer_5F_norm_2E_weight.bin(float32:1280)*output:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Mul_5F_output_5F_0(1,77,1280) /te2/text_model/final_layer_norm/Add_1:Add*input:_2F_te2_2F_text_5F_model_2F_final_5F_layer_5F_norm_2F_Mul_5F_output_5F_0(1,77,1280);te2_2E_text_5F_model_2E_final_5F_layer_5F_norm_2E_bias.bin(float32:1280)*output:out_5F_1(1,77,1280) /te2/text_model/ArgMax:ArgMax*input:input_5F_ids(1,77)*output:_2F_te2_2F_text_5F_model_2F_ArgMax_5F_output_5F_0(1)*axis:-1;keepdims:0;select_last_index:0 /te2/text_model/Reshape:Reshape*input:out_5F_1(1,77,1280);out_5F_1_5F_Reshape.bin(int64:2)*output:_2F_te2_2F_text_5F_model_2F_Flatten_5F_output_5F_0(77,1280)*allowzero:0 /te2/text_model/Gather_2:Gather*input:_2F_te2_2F_text_5F_model_2F_Flatten_5F_output_5F_0(77,1280);_2F_te2_2F_text_5F_model_2F_ArgMax_5F_output_5F_0(1)*output:_2F_te2_2F_text_5F_model_2F_Gather_5F_2_5F_output_5F_0(1,1280) /te2/text_projection/MatMul:MatMul*input:_2F_te2_2F_text_5F_model_2F_Gather_5F_2_5F_output_5F_0(1,1280);onnx_3A__3A_MatMul_5F_7246.bin(float32:1280,1280)*output:out_5F_0(1,1280)