Androidonnxfork's picture
Upload folder using huggingface_hub
e82443b
raw
history blame contribute delete
No virus
95.6 kB
Reshape_113:Reshape*input:onnx_3A__3A_Reshape_5F_0(1,77);onnx_3A__3A_Reshape_5F_2274.bin(int64:2)*output:input(1,77)*allowzero:0
Gather_114:Gather*input:text_5F_model_2E_embeddings_2E_token_5F_embedding_2E_wrapped_2E_weight.bin(float32:49408,768);input(1,77)*output:onnx_3A__3A_Add_5F_212(1,77,768)
Add_116:Add*input:onnx_3A__3A_Add_5F_212(1,77,768);onnx_3A__3A_Add_5F_213.bin(float32:1,77,768)*output:input_2E_7(1,77,768)
ReduceMean_123:ReduceMean*input:input_2E_7(1,77,768)*output:onnx_3A__3A_Sub_5F_221(1,77,1)*axes:-1
Sub_124:Sub*input:input_2E_7(1,77,768);onnx_3A__3A_Sub_5F_221(1,77,1)*output:onnx_3A__3A_Pow_5F_222(1,77,768)
Pow_126:Pow*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_224(1,77,768)
ReduceMean_127:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_224(1,77,768)*output:onnx_3A__3A_Add_5F_225(1,77,1)*axes:-1
Add_129:Add*input:onnx_3A__3A_Add_5F_225(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_227(1,77,1)
Sqrt_130:Sqrt*input:onnx_3A__3A_Sqrt_5F_227(1,77,1)*output:onnx_3A__3A_Div_5F_228(1,77,1)
Div_131:Div*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Div_5F_228(1,77,1)*output:onnx_3A__3A_Mul_5F_229(1,77,768)
Mul_132:Mul*input:onnx_3A__3A_Mul_5F_229(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_230(1,77,768)
Add_133:Add*input:onnx_3A__3A_Add_5F_230(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_231(1,77,768)
MatMul_134:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2276.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_236(1,77,768)
Add_135:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_236(1,77,768)*output:onnx_3A__3A_Mul_5F_237(1,77,768)
Mul_137:Mul*input:onnx_3A__3A_Mul_5F_237(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states(1,77,768)
MatMul_138:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2277.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_241(1,77,768)
Add_139:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_241(1,77,768)*output:onnx_3A__3A_Reshape_5F_242(1,77,768)
Reshape_140:Reshape*input:onnx_3A__3A_Reshape_5F_242(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*allowzero:0
Transpose_141:Transpose*input:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_256(1,12,77,64)*perm:0,2,1,3
MatMul_142:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2283.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_258(1,77,768)
Add_143:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_258(1,77,768)*output:onnx_3A__3A_Reshape_5F_259(1,77,768)
Reshape_144:Reshape*input:onnx_3A__3A_Reshape_5F_259(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*allowzero:0
Transpose_145:Transpose*input:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_273(1,12,77,64)*perm:0,2,1,3
Reshape_146:Reshape*input:query_5F_states(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*allowzero:0
Transpose_147:Transpose*input:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_287(1,12,77,64)*perm:0,2,1,3
Reshape_148:Reshape*input:onnx_3A__3A_Reshape_5F_287(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_297(12,77,64)*allowzero:0
Reshape_149:Reshape*input:onnx_3A__3A_Reshape_5F_256(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_307(12,77,64)*allowzero:0
Reshape_150:Reshape*input:onnx_3A__3A_Reshape_5F_273(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_317(12,77,64)*allowzero:0
Transpose_151:Transpose*input:onnx_3A__3A_Transpose_5F_307(12,77,64)*output:onnx_3A__3A_MatMul_5F_319(12,64,77)*perm:0,2,1
MatMul_152:MatMul*input:onnx_3A__3A_MatMul_5F_297(12,77,64);onnx_3A__3A_MatMul_5F_319(12,64,77)*output:onnx_3A__3A_Reshape_5F_320(12,77,77)
Reshape_153:Reshape*input:onnx_3A__3A_Reshape_5F_320(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_331(1,12,77,77)*allowzero:0
Add_154:Add*input:onnx_3A__3A_Add_5F_331(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_332(1,12,77,77)
Reshape_155:Reshape*input:onnx_3A__3A_Reshape_5F_332(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights(12,77,77)*allowzero:0
Softmax_156:Softmax*input:attn_5F_weights(12,77,77)*output:attn_5F_weights_2E_3(12,77,77)*axis:-1
MatMul_157:MatMul*input:attn_5F_weights_2E_3(12,77,77);onnx_3A__3A_MatMul_5F_317(12,77,64)*output:onnx_3A__3A_Reshape_5F_343(12,77,64)
Reshape_158:Reshape*input:onnx_3A__3A_Reshape_5F_343(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*allowzero:0
Transpose_159:Transpose*input:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_356(1,77,12,64)*perm:0,2,1,3
Reshape_160:Reshape*input:onnx_3A__3A_Reshape_5F_356(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_364(1,77,768)*allowzero:0
MatMul_161:MatMul*input:onnx_3A__3A_MatMul_5F_364(1,77,768);onnx_3A__3A_MatMul_5F_2324.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_366(1,77,768)
Add_162:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_366(1,77,768)*output:onnx_3A__3A_Add_5F_367(1,77,768)
Add_163:Add*input:input_2E_7(1,77,768);onnx_3A__3A_Add_5F_367(1,77,768)*output:input_2E_11(1,77,768)
ReduceMean_164:ReduceMean*input:input_2E_11(1,77,768)*output:onnx_3A__3A_Sub_5F_369(1,77,1)*axes:-1
Sub_165:Sub*input:input_2E_11(1,77,768);onnx_3A__3A_Sub_5F_369(1,77,1)*output:onnx_3A__3A_Pow_5F_370(1,77,768)
Pow_167:Pow*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_372(1,77,768)
ReduceMean_168:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_372(1,77,768)*output:onnx_3A__3A_Add_5F_373(1,77,1)*axes:-1
Add_170:Add*input:onnx_3A__3A_Add_5F_373(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_375(1,77,1)
Sqrt_171:Sqrt*input:onnx_3A__3A_Sqrt_5F_375(1,77,1)*output:onnx_3A__3A_Div_5F_376(1,77,1)
Div_172:Div*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Div_5F_376(1,77,1)*output:onnx_3A__3A_Mul_5F_377(1,77,768)
Mul_173:Mul*input:onnx_3A__3A_Mul_5F_377(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_378(1,77,768)
Add_174:Add*input:onnx_3A__3A_Add_5F_378(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_379(1,77,768)
MatMul_175:MatMul*input:onnx_3A__3A_MatMul_5F_379(1,77,768);onnx_3A__3A_MatMul_5F_2325.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_381(1,77,3072)
Add_176:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_381(1,77,3072)*output:onnx_3A__3A_Mul_5F_382(1,77,3072)
Mul_178:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_384(1,77,3072)
Sigmoid_179:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_384(1,77,3072)*output:onnx_3A__3A_Mul_5F_385(1,77,3072)
Mul_180:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_385(1,77,3072)*output:onnx_3A__3A_MatMul_5F_386(1,77,3072)
MatMul_181:MatMul*input:onnx_3A__3A_MatMul_5F_386(1,77,3072);onnx_3A__3A_MatMul_5F_2326.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_388(1,77,768)
Add_182:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_388(1,77,768)*output:onnx_3A__3A_Add_5F_389(1,77,768)
Add_183:Add*input:input_2E_11(1,77,768);onnx_3A__3A_Add_5F_389(1,77,768)*output:input_2E_15(1,77,768)
ReduceMean_184:ReduceMean*input:input_2E_15(1,77,768)*output:onnx_3A__3A_Sub_5F_391(1,77,1)*axes:-1
Sub_185:Sub*input:input_2E_15(1,77,768);onnx_3A__3A_Sub_5F_391(1,77,1)*output:onnx_3A__3A_Pow_5F_392(1,77,768)
Pow_187:Pow*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_394(1,77,768)
ReduceMean_188:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_394(1,77,768)*output:onnx_3A__3A_Add_5F_395(1,77,1)*axes:-1
Add_190:Add*input:onnx_3A__3A_Add_5F_395(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_397(1,77,1)
Sqrt_191:Sqrt*input:onnx_3A__3A_Sqrt_5F_397(1,77,1)*output:onnx_3A__3A_Div_5F_398(1,77,1)
Div_192:Div*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Div_5F_398(1,77,1)*output:onnx_3A__3A_Mul_5F_399(1,77,768)
Mul_193:Mul*input:onnx_3A__3A_Mul_5F_399(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_400(1,77,768)
Add_194:Add*input:onnx_3A__3A_Add_5F_400(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_401(1,77,768)
MatMul_195:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2327.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_406(1,77,768)
Add_196:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_406(1,77,768)*output:onnx_3A__3A_Mul_5F_407(1,77,768)
Mul_198:Mul*input:onnx_3A__3A_Mul_5F_407(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_3(1,77,768)
MatMul_199:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2328.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_411(1,77,768)
Add_200:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_411(1,77,768)*output:onnx_3A__3A_Reshape_5F_412(1,77,768)
Reshape_201:Reshape*input:onnx_3A__3A_Reshape_5F_412(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*allowzero:0
Transpose_202:Transpose*input:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_426(1,12,77,64)*perm:0,2,1,3
MatMul_203:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2334.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_428(1,77,768)
Add_204:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_428(1,77,768)*output:onnx_3A__3A_Reshape_5F_429(1,77,768)
Reshape_205:Reshape*input:onnx_3A__3A_Reshape_5F_429(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*allowzero:0
Transpose_206:Transpose*input:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_443(1,12,77,64)*perm:0,2,1,3
Reshape_207:Reshape*input:query_5F_states_2E_3(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*allowzero:0
Transpose_208:Transpose*input:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_457(1,12,77,64)*perm:0,2,1,3
Reshape_209:Reshape*input:onnx_3A__3A_Reshape_5F_457(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_467(12,77,64)*allowzero:0
Reshape_210:Reshape*input:onnx_3A__3A_Reshape_5F_426(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_477(12,77,64)*allowzero:0
Reshape_211:Reshape*input:onnx_3A__3A_Reshape_5F_443(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_487(12,77,64)*allowzero:0
Transpose_212:Transpose*input:onnx_3A__3A_Transpose_5F_477(12,77,64)*output:onnx_3A__3A_MatMul_5F_489(12,64,77)*perm:0,2,1
MatMul_213:MatMul*input:onnx_3A__3A_MatMul_5F_467(12,77,64);onnx_3A__3A_MatMul_5F_489(12,64,77)*output:onnx_3A__3A_Reshape_5F_490(12,77,77)
Reshape_214:Reshape*input:onnx_3A__3A_Reshape_5F_490(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_501(1,12,77,77)*allowzero:0
Add_215:Add*input:onnx_3A__3A_Add_5F_501(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_502(1,12,77,77)
Reshape_216:Reshape*input:onnx_3A__3A_Reshape_5F_502(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_7(12,77,77)*allowzero:0
Softmax_217:Softmax*input:attn_5F_weights_2E_7(12,77,77)*output:attn_5F_weights_2E_11(12,77,77)*axis:-1
MatMul_218:MatMul*input:attn_5F_weights_2E_11(12,77,77);onnx_3A__3A_MatMul_5F_487(12,77,64)*output:onnx_3A__3A_Reshape_5F_513(12,77,64)
Reshape_219:Reshape*input:onnx_3A__3A_Reshape_5F_513(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*allowzero:0
Transpose_220:Transpose*input:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_526(1,77,12,64)*perm:0,2,1,3
Reshape_221:Reshape*input:onnx_3A__3A_Reshape_5F_526(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_534(1,77,768)*allowzero:0
MatMul_222:MatMul*input:onnx_3A__3A_MatMul_5F_534(1,77,768);onnx_3A__3A_MatMul_5F_2375.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_536(1,77,768)
Add_223:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_536(1,77,768)*output:onnx_3A__3A_Add_5F_537(1,77,768)
Add_224:Add*input:input_2E_15(1,77,768);onnx_3A__3A_Add_5F_537(1,77,768)*output:input_2E_19(1,77,768)
ReduceMean_225:ReduceMean*input:input_2E_19(1,77,768)*output:onnx_3A__3A_Sub_5F_539(1,77,1)*axes:-1
Sub_226:Sub*input:input_2E_19(1,77,768);onnx_3A__3A_Sub_5F_539(1,77,1)*output:onnx_3A__3A_Pow_5F_540(1,77,768)
Pow_228:Pow*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_542(1,77,768)
ReduceMean_229:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_542(1,77,768)*output:onnx_3A__3A_Add_5F_543(1,77,1)*axes:-1
Add_231:Add*input:onnx_3A__3A_Add_5F_543(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_545(1,77,1)
Sqrt_232:Sqrt*input:onnx_3A__3A_Sqrt_5F_545(1,77,1)*output:onnx_3A__3A_Div_5F_546(1,77,1)
Div_233:Div*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Div_5F_546(1,77,1)*output:onnx_3A__3A_Mul_5F_547(1,77,768)
Mul_234:Mul*input:onnx_3A__3A_Mul_5F_547(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_548(1,77,768)
Add_235:Add*input:onnx_3A__3A_Add_5F_548(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_549(1,77,768)
MatMul_236:MatMul*input:onnx_3A__3A_MatMul_5F_549(1,77,768);onnx_3A__3A_MatMul_5F_2376.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_551(1,77,3072)
Add_237:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_551(1,77,3072)*output:onnx_3A__3A_Mul_5F_552(1,77,3072)
Mul_239:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_554(1,77,3072)
Sigmoid_240:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_554(1,77,3072)*output:onnx_3A__3A_Mul_5F_555(1,77,3072)
Mul_241:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_555(1,77,3072)*output:onnx_3A__3A_MatMul_5F_556(1,77,3072)
MatMul_242:MatMul*input:onnx_3A__3A_MatMul_5F_556(1,77,3072);onnx_3A__3A_MatMul_5F_2377.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_558(1,77,768)
Add_243:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_558(1,77,768)*output:onnx_3A__3A_Add_5F_559(1,77,768)
Add_244:Add*input:input_2E_19(1,77,768);onnx_3A__3A_Add_5F_559(1,77,768)*output:input_2E_23(1,77,768)
ReduceMean_245:ReduceMean*input:input_2E_23(1,77,768)*output:onnx_3A__3A_Sub_5F_561(1,77,1)*axes:-1
Sub_246:Sub*input:input_2E_23(1,77,768);onnx_3A__3A_Sub_5F_561(1,77,1)*output:onnx_3A__3A_Pow_5F_562(1,77,768)
Pow_248:Pow*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_564(1,77,768)
ReduceMean_249:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_564(1,77,768)*output:onnx_3A__3A_Add_5F_565(1,77,1)*axes:-1
Add_251:Add*input:onnx_3A__3A_Add_5F_565(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_567(1,77,1)
Sqrt_252:Sqrt*input:onnx_3A__3A_Sqrt_5F_567(1,77,1)*output:onnx_3A__3A_Div_5F_568(1,77,1)
Div_253:Div*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Div_5F_568(1,77,1)*output:onnx_3A__3A_Mul_5F_569(1,77,768)
Mul_254:Mul*input:onnx_3A__3A_Mul_5F_569(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_570(1,77,768)
Add_255:Add*input:onnx_3A__3A_Add_5F_570(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_571(1,77,768)
MatMul_256:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2378.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_576(1,77,768)
Add_257:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_576(1,77,768)*output:onnx_3A__3A_Mul_5F_577(1,77,768)
Mul_259:Mul*input:onnx_3A__3A_Mul_5F_577(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_7(1,77,768)
MatMul_260:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2379.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_581(1,77,768)
Add_261:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_581(1,77,768)*output:onnx_3A__3A_Reshape_5F_582(1,77,768)
Reshape_262:Reshape*input:onnx_3A__3A_Reshape_5F_582(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*allowzero:0
Transpose_263:Transpose*input:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_596(1,12,77,64)*perm:0,2,1,3
MatMul_264:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2385.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_598(1,77,768)
Add_265:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_598(1,77,768)*output:onnx_3A__3A_Reshape_5F_599(1,77,768)
Reshape_266:Reshape*input:onnx_3A__3A_Reshape_5F_599(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*allowzero:0
Transpose_267:Transpose*input:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_613(1,12,77,64)*perm:0,2,1,3
Reshape_268:Reshape*input:query_5F_states_2E_7(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*allowzero:0
Transpose_269:Transpose*input:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_627(1,12,77,64)*perm:0,2,1,3
Reshape_270:Reshape*input:onnx_3A__3A_Reshape_5F_627(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_637(12,77,64)*allowzero:0
Reshape_271:Reshape*input:onnx_3A__3A_Reshape_5F_596(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_647(12,77,64)*allowzero:0
Reshape_272:Reshape*input:onnx_3A__3A_Reshape_5F_613(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_657(12,77,64)*allowzero:0
Transpose_273:Transpose*input:onnx_3A__3A_Transpose_5F_647(12,77,64)*output:onnx_3A__3A_MatMul_5F_659(12,64,77)*perm:0,2,1
MatMul_274:MatMul*input:onnx_3A__3A_MatMul_5F_637(12,77,64);onnx_3A__3A_MatMul_5F_659(12,64,77)*output:onnx_3A__3A_Reshape_5F_660(12,77,77)
Reshape_275:Reshape*input:onnx_3A__3A_Reshape_5F_660(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_671(1,12,77,77)*allowzero:0
Add_276:Add*input:onnx_3A__3A_Add_5F_671(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_672(1,12,77,77)
Reshape_277:Reshape*input:onnx_3A__3A_Reshape_5F_672(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_15(12,77,77)*allowzero:0
Softmax_278:Softmax*input:attn_5F_weights_2E_15(12,77,77)*output:attn_5F_weights_2E_19(12,77,77)*axis:-1
MatMul_279:MatMul*input:attn_5F_weights_2E_19(12,77,77);onnx_3A__3A_MatMul_5F_657(12,77,64)*output:onnx_3A__3A_Reshape_5F_683(12,77,64)
Reshape_280:Reshape*input:onnx_3A__3A_Reshape_5F_683(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*allowzero:0
Transpose_281:Transpose*input:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_696(1,77,12,64)*perm:0,2,1,3
Reshape_282:Reshape*input:onnx_3A__3A_Reshape_5F_696(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_704(1,77,768)*allowzero:0
MatMul_283:MatMul*input:onnx_3A__3A_MatMul_5F_704(1,77,768);onnx_3A__3A_MatMul_5F_2426.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_706(1,77,768)
Add_284:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_706(1,77,768)*output:onnx_3A__3A_Add_5F_707(1,77,768)
Add_285:Add*input:input_2E_23(1,77,768);onnx_3A__3A_Add_5F_707(1,77,768)*output:input_2E_27(1,77,768)
ReduceMean_286:ReduceMean*input:input_2E_27(1,77,768)*output:onnx_3A__3A_Sub_5F_709(1,77,1)*axes:-1
Sub_287:Sub*input:input_2E_27(1,77,768);onnx_3A__3A_Sub_5F_709(1,77,1)*output:onnx_3A__3A_Pow_5F_710(1,77,768)
Pow_289:Pow*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_712(1,77,768)
ReduceMean_290:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_712(1,77,768)*output:onnx_3A__3A_Add_5F_713(1,77,1)*axes:-1
Add_292:Add*input:onnx_3A__3A_Add_5F_713(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_715(1,77,1)
Sqrt_293:Sqrt*input:onnx_3A__3A_Sqrt_5F_715(1,77,1)*output:onnx_3A__3A_Div_5F_716(1,77,1)
Div_294:Div*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Div_5F_716(1,77,1)*output:onnx_3A__3A_Mul_5F_717(1,77,768)
Mul_295:Mul*input:onnx_3A__3A_Mul_5F_717(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_718(1,77,768)
Add_296:Add*input:onnx_3A__3A_Add_5F_718(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_719(1,77,768)
MatMul_297:MatMul*input:onnx_3A__3A_MatMul_5F_719(1,77,768);onnx_3A__3A_MatMul_5F_2427.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_721(1,77,3072)
Add_298:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_721(1,77,3072)*output:onnx_3A__3A_Mul_5F_722(1,77,3072)
Mul_300:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_724(1,77,3072)
Sigmoid_301:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_724(1,77,3072)*output:onnx_3A__3A_Mul_5F_725(1,77,3072)
Mul_302:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_725(1,77,3072)*output:onnx_3A__3A_MatMul_5F_726(1,77,3072)
MatMul_303:MatMul*input:onnx_3A__3A_MatMul_5F_726(1,77,3072);onnx_3A__3A_MatMul_5F_2428.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_728(1,77,768)
Add_304:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_728(1,77,768)*output:onnx_3A__3A_Add_5F_729(1,77,768)
Add_305:Add*input:input_2E_27(1,77,768);onnx_3A__3A_Add_5F_729(1,77,768)*output:input_2E_31(1,77,768)
ReduceMean_306:ReduceMean*input:input_2E_31(1,77,768)*output:onnx_3A__3A_Sub_5F_731(1,77,1)*axes:-1
Sub_307:Sub*input:input_2E_31(1,77,768);onnx_3A__3A_Sub_5F_731(1,77,1)*output:onnx_3A__3A_Pow_5F_732(1,77,768)
Pow_309:Pow*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_734(1,77,768)
ReduceMean_310:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_734(1,77,768)*output:onnx_3A__3A_Add_5F_735(1,77,1)*axes:-1
Add_312:Add*input:onnx_3A__3A_Add_5F_735(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_737(1,77,1)
Sqrt_313:Sqrt*input:onnx_3A__3A_Sqrt_5F_737(1,77,1)*output:onnx_3A__3A_Div_5F_738(1,77,1)
Div_314:Div*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Div_5F_738(1,77,1)*output:onnx_3A__3A_Mul_5F_739(1,77,768)
Mul_315:Mul*input:onnx_3A__3A_Mul_5F_739(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_740(1,77,768)
Add_316:Add*input:onnx_3A__3A_Add_5F_740(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_741(1,77,768)
MatMul_317:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2429.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_746(1,77,768)
Add_318:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_746(1,77,768)*output:onnx_3A__3A_Mul_5F_747(1,77,768)
Mul_320:Mul*input:onnx_3A__3A_Mul_5F_747(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_11(1,77,768)
MatMul_321:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2430.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_751(1,77,768)
Add_322:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_751(1,77,768)*output:onnx_3A__3A_Reshape_5F_752(1,77,768)
Reshape_323:Reshape*input:onnx_3A__3A_Reshape_5F_752(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*allowzero:0
Transpose_324:Transpose*input:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_766(1,12,77,64)*perm:0,2,1,3
MatMul_325:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2436.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_768(1,77,768)
Add_326:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_768(1,77,768)*output:onnx_3A__3A_Reshape_5F_769(1,77,768)
Reshape_327:Reshape*input:onnx_3A__3A_Reshape_5F_769(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*allowzero:0
Transpose_328:Transpose*input:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_783(1,12,77,64)*perm:0,2,1,3
Reshape_329:Reshape*input:query_5F_states_2E_11(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*allowzero:0
Transpose_330:Transpose*input:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_797(1,12,77,64)*perm:0,2,1,3
Reshape_331:Reshape*input:onnx_3A__3A_Reshape_5F_797(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_807(12,77,64)*allowzero:0
Reshape_332:Reshape*input:onnx_3A__3A_Reshape_5F_766(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_817(12,77,64)*allowzero:0
Reshape_333:Reshape*input:onnx_3A__3A_Reshape_5F_783(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_827(12,77,64)*allowzero:0
Transpose_334:Transpose*input:onnx_3A__3A_Transpose_5F_817(12,77,64)*output:onnx_3A__3A_MatMul_5F_829(12,64,77)*perm:0,2,1
MatMul_335:MatMul*input:onnx_3A__3A_MatMul_5F_807(12,77,64);onnx_3A__3A_MatMul_5F_829(12,64,77)*output:onnx_3A__3A_Reshape_5F_830(12,77,77)
Reshape_336:Reshape*input:onnx_3A__3A_Reshape_5F_830(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_841(1,12,77,77)*allowzero:0
Add_337:Add*input:onnx_3A__3A_Add_5F_841(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_842(1,12,77,77)
Reshape_338:Reshape*input:onnx_3A__3A_Reshape_5F_842(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_23(12,77,77)*allowzero:0
Softmax_339:Softmax*input:attn_5F_weights_2E_23(12,77,77)*output:attn_5F_weights_2E_27(12,77,77)*axis:-1
MatMul_340:MatMul*input:attn_5F_weights_2E_27(12,77,77);onnx_3A__3A_MatMul_5F_827(12,77,64)*output:onnx_3A__3A_Reshape_5F_853(12,77,64)
Reshape_341:Reshape*input:onnx_3A__3A_Reshape_5F_853(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*allowzero:0
Transpose_342:Transpose*input:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_866(1,77,12,64)*perm:0,2,1,3
Reshape_343:Reshape*input:onnx_3A__3A_Reshape_5F_866(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_874(1,77,768)*allowzero:0
MatMul_344:MatMul*input:onnx_3A__3A_MatMul_5F_874(1,77,768);onnx_3A__3A_MatMul_5F_2477.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_876(1,77,768)
Add_345:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_876(1,77,768)*output:onnx_3A__3A_Add_5F_877(1,77,768)
Add_346:Add*input:input_2E_31(1,77,768);onnx_3A__3A_Add_5F_877(1,77,768)*output:input_2E_35(1,77,768)
ReduceMean_347:ReduceMean*input:input_2E_35(1,77,768)*output:onnx_3A__3A_Sub_5F_879(1,77,1)*axes:-1
Sub_348:Sub*input:input_2E_35(1,77,768);onnx_3A__3A_Sub_5F_879(1,77,1)*output:onnx_3A__3A_Pow_5F_880(1,77,768)
Pow_350:Pow*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_882(1,77,768)
ReduceMean_351:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_882(1,77,768)*output:onnx_3A__3A_Add_5F_883(1,77,1)*axes:-1
Add_353:Add*input:onnx_3A__3A_Add_5F_883(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_885(1,77,1)
Sqrt_354:Sqrt*input:onnx_3A__3A_Sqrt_5F_885(1,77,1)*output:onnx_3A__3A_Div_5F_886(1,77,1)
Div_355:Div*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Div_5F_886(1,77,1)*output:onnx_3A__3A_Mul_5F_887(1,77,768)
Mul_356:Mul*input:onnx_3A__3A_Mul_5F_887(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_888(1,77,768)
Add_357:Add*input:onnx_3A__3A_Add_5F_888(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_889(1,77,768)
MatMul_358:MatMul*input:onnx_3A__3A_MatMul_5F_889(1,77,768);onnx_3A__3A_MatMul_5F_2478.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_891(1,77,3072)
Add_359:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_891(1,77,3072)*output:onnx_3A__3A_Mul_5F_892(1,77,3072)
Mul_361:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_894(1,77,3072)
Sigmoid_362:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_894(1,77,3072)*output:onnx_3A__3A_Mul_5F_895(1,77,3072)
Mul_363:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_895(1,77,3072)*output:onnx_3A__3A_MatMul_5F_896(1,77,3072)
MatMul_364:MatMul*input:onnx_3A__3A_MatMul_5F_896(1,77,3072);onnx_3A__3A_MatMul_5F_2479.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_898(1,77,768)
Add_365:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_898(1,77,768)*output:onnx_3A__3A_Add_5F_899(1,77,768)
Add_366:Add*input:input_2E_35(1,77,768);onnx_3A__3A_Add_5F_899(1,77,768)*output:input_2E_39(1,77,768)
ReduceMean_367:ReduceMean*input:input_2E_39(1,77,768)*output:onnx_3A__3A_Sub_5F_901(1,77,1)*axes:-1
Sub_368:Sub*input:input_2E_39(1,77,768);onnx_3A__3A_Sub_5F_901(1,77,1)*output:onnx_3A__3A_Pow_5F_902(1,77,768)
Pow_370:Pow*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_904(1,77,768)
ReduceMean_371:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_904(1,77,768)*output:onnx_3A__3A_Add_5F_905(1,77,1)*axes:-1
Add_373:Add*input:onnx_3A__3A_Add_5F_905(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_907(1,77,1)
Sqrt_374:Sqrt*input:onnx_3A__3A_Sqrt_5F_907(1,77,1)*output:onnx_3A__3A_Div_5F_908(1,77,1)
Div_375:Div*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Div_5F_908(1,77,1)*output:onnx_3A__3A_Mul_5F_909(1,77,768)
Mul_376:Mul*input:onnx_3A__3A_Mul_5F_909(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_910(1,77,768)
Add_377:Add*input:onnx_3A__3A_Add_5F_910(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_911(1,77,768)
MatMul_378:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2480.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_916(1,77,768)
Add_379:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_916(1,77,768)*output:onnx_3A__3A_Mul_5F_917(1,77,768)
Mul_381:Mul*input:onnx_3A__3A_Mul_5F_917(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_15(1,77,768)
MatMul_382:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2481.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_921(1,77,768)
Add_383:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_921(1,77,768)*output:onnx_3A__3A_Reshape_5F_922(1,77,768)
Reshape_384:Reshape*input:onnx_3A__3A_Reshape_5F_922(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*allowzero:0
Transpose_385:Transpose*input:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_936(1,12,77,64)*perm:0,2,1,3
MatMul_386:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2487.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_938(1,77,768)
Add_387:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_938(1,77,768)*output:onnx_3A__3A_Reshape_5F_939(1,77,768)
Reshape_388:Reshape*input:onnx_3A__3A_Reshape_5F_939(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*allowzero:0
Transpose_389:Transpose*input:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_953(1,12,77,64)*perm:0,2,1,3
Reshape_390:Reshape*input:query_5F_states_2E_15(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*allowzero:0
Transpose_391:Transpose*input:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_967(1,12,77,64)*perm:0,2,1,3
Reshape_392:Reshape*input:onnx_3A__3A_Reshape_5F_967(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_977(12,77,64)*allowzero:0
Reshape_393:Reshape*input:onnx_3A__3A_Reshape_5F_936(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_987(12,77,64)*allowzero:0
Reshape_394:Reshape*input:onnx_3A__3A_Reshape_5F_953(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_997(12,77,64)*allowzero:0
Transpose_395:Transpose*input:onnx_3A__3A_Transpose_5F_987(12,77,64)*output:onnx_3A__3A_MatMul_5F_999(12,64,77)*perm:0,2,1
MatMul_396:MatMul*input:onnx_3A__3A_MatMul_5F_977(12,77,64);onnx_3A__3A_MatMul_5F_999(12,64,77)*output:onnx_3A__3A_Reshape_5F_1000(12,77,77)
Reshape_397:Reshape*input:onnx_3A__3A_Reshape_5F_1000(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1011(1,12,77,77)*allowzero:0
Add_398:Add*input:onnx_3A__3A_Add_5F_1011(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1012(1,12,77,77)
Reshape_399:Reshape*input:onnx_3A__3A_Reshape_5F_1012(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_31(12,77,77)*allowzero:0
Softmax_400:Softmax*input:attn_5F_weights_2E_31(12,77,77)*output:attn_5F_weights_2E_35(12,77,77)*axis:-1
MatMul_401:MatMul*input:attn_5F_weights_2E_35(12,77,77);onnx_3A__3A_MatMul_5F_997(12,77,64)*output:onnx_3A__3A_Reshape_5F_1023(12,77,64)
Reshape_402:Reshape*input:onnx_3A__3A_Reshape_5F_1023(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*allowzero:0
Transpose_403:Transpose*input:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1036(1,77,12,64)*perm:0,2,1,3
Reshape_404:Reshape*input:onnx_3A__3A_Reshape_5F_1036(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1044(1,77,768)*allowzero:0
MatMul_405:MatMul*input:onnx_3A__3A_MatMul_5F_1044(1,77,768);onnx_3A__3A_MatMul_5F_2528.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1046(1,77,768)
Add_406:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1046(1,77,768)*output:onnx_3A__3A_Add_5F_1047(1,77,768)
Add_407:Add*input:input_2E_39(1,77,768);onnx_3A__3A_Add_5F_1047(1,77,768)*output:input_2E_43(1,77,768)
ReduceMean_408:ReduceMean*input:input_2E_43(1,77,768)*output:onnx_3A__3A_Sub_5F_1049(1,77,1)*axes:-1
Sub_409:Sub*input:input_2E_43(1,77,768);onnx_3A__3A_Sub_5F_1049(1,77,1)*output:onnx_3A__3A_Pow_5F_1050(1,77,768)
Pow_411:Pow*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1052(1,77,768)
ReduceMean_412:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1052(1,77,768)*output:onnx_3A__3A_Add_5F_1053(1,77,1)*axes:-1
Add_414:Add*input:onnx_3A__3A_Add_5F_1053(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1055(1,77,1)
Sqrt_415:Sqrt*input:onnx_3A__3A_Sqrt_5F_1055(1,77,1)*output:onnx_3A__3A_Div_5F_1056(1,77,1)
Div_416:Div*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Div_5F_1056(1,77,1)*output:onnx_3A__3A_Mul_5F_1057(1,77,768)
Mul_417:Mul*input:onnx_3A__3A_Mul_5F_1057(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1058(1,77,768)
Add_418:Add*input:onnx_3A__3A_Add_5F_1058(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1059(1,77,768)
MatMul_419:MatMul*input:onnx_3A__3A_MatMul_5F_1059(1,77,768);onnx_3A__3A_MatMul_5F_2529.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1061(1,77,3072)
Add_420:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1061(1,77,3072)*output:onnx_3A__3A_Mul_5F_1062(1,77,3072)
Mul_422:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072)
Sigmoid_423:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072)*output:onnx_3A__3A_Mul_5F_1065(1,77,3072)
Mul_424:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_1065(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1066(1,77,3072)
MatMul_425:MatMul*input:onnx_3A__3A_MatMul_5F_1066(1,77,3072);onnx_3A__3A_MatMul_5F_2530.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1068(1,77,768)
Add_426:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1068(1,77,768)*output:onnx_3A__3A_Add_5F_1069(1,77,768)
Add_427:Add*input:input_2E_43(1,77,768);onnx_3A__3A_Add_5F_1069(1,77,768)*output:input_2E_47(1,77,768)
ReduceMean_428:ReduceMean*input:input_2E_47(1,77,768)*output:onnx_3A__3A_Sub_5F_1071(1,77,1)*axes:-1
Sub_429:Sub*input:input_2E_47(1,77,768);onnx_3A__3A_Sub_5F_1071(1,77,1)*output:onnx_3A__3A_Pow_5F_1072(1,77,768)
Pow_431:Pow*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1074(1,77,768)
ReduceMean_432:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1074(1,77,768)*output:onnx_3A__3A_Add_5F_1075(1,77,1)*axes:-1
Add_434:Add*input:onnx_3A__3A_Add_5F_1075(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1077(1,77,1)
Sqrt_435:Sqrt*input:onnx_3A__3A_Sqrt_5F_1077(1,77,1)*output:onnx_3A__3A_Div_5F_1078(1,77,1)
Div_436:Div*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Div_5F_1078(1,77,1)*output:onnx_3A__3A_Mul_5F_1079(1,77,768)
Mul_437:Mul*input:onnx_3A__3A_Mul_5F_1079(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1080(1,77,768)
Add_438:Add*input:onnx_3A__3A_Add_5F_1080(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1081(1,77,768)
MatMul_439:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2531.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1086(1,77,768)
Add_440:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1086(1,77,768)*output:onnx_3A__3A_Mul_5F_1087(1,77,768)
Mul_442:Mul*input:onnx_3A__3A_Mul_5F_1087(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_19(1,77,768)
MatMul_443:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2532.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1091(1,77,768)
Add_444:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1091(1,77,768)*output:onnx_3A__3A_Reshape_5F_1092(1,77,768)
Reshape_445:Reshape*input:onnx_3A__3A_Reshape_5F_1092(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*allowzero:0
Transpose_446:Transpose*input:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1106(1,12,77,64)*perm:0,2,1,3
MatMul_447:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2538.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1108(1,77,768)
Add_448:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1108(1,77,768)*output:onnx_3A__3A_Reshape_5F_1109(1,77,768)
Reshape_449:Reshape*input:onnx_3A__3A_Reshape_5F_1109(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*allowzero:0
Transpose_450:Transpose*input:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1123(1,12,77,64)*perm:0,2,1,3
Reshape_451:Reshape*input:query_5F_states_2E_19(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*allowzero:0
Transpose_452:Transpose*input:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1137(1,12,77,64)*perm:0,2,1,3
Reshape_453:Reshape*input:onnx_3A__3A_Reshape_5F_1137(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1147(12,77,64)*allowzero:0
Reshape_454:Reshape*input:onnx_3A__3A_Reshape_5F_1106(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1157(12,77,64)*allowzero:0
Reshape_455:Reshape*input:onnx_3A__3A_Reshape_5F_1123(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1167(12,77,64)*allowzero:0
Transpose_456:Transpose*input:onnx_3A__3A_Transpose_5F_1157(12,77,64)*output:onnx_3A__3A_MatMul_5F_1169(12,64,77)*perm:0,2,1
MatMul_457:MatMul*input:onnx_3A__3A_MatMul_5F_1147(12,77,64);onnx_3A__3A_MatMul_5F_1169(12,64,77)*output:onnx_3A__3A_Reshape_5F_1170(12,77,77)
Reshape_458:Reshape*input:onnx_3A__3A_Reshape_5F_1170(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1181(1,12,77,77)*allowzero:0
Add_459:Add*input:onnx_3A__3A_Add_5F_1181(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1182(1,12,77,77)
Reshape_460:Reshape*input:onnx_3A__3A_Reshape_5F_1182(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_39(12,77,77)*allowzero:0
Softmax_461:Softmax*input:attn_5F_weights_2E_39(12,77,77)*output:attn_5F_weights_2E_43(12,77,77)*axis:-1
MatMul_462:MatMul*input:attn_5F_weights_2E_43(12,77,77);onnx_3A__3A_MatMul_5F_1167(12,77,64)*output:onnx_3A__3A_Reshape_5F_1193(12,77,64)
Reshape_463:Reshape*input:onnx_3A__3A_Reshape_5F_1193(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*allowzero:0
Transpose_464:Transpose*input:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1206(1,77,12,64)*perm:0,2,1,3
Reshape_465:Reshape*input:onnx_3A__3A_Reshape_5F_1206(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1214(1,77,768)*allowzero:0
MatMul_466:MatMul*input:onnx_3A__3A_MatMul_5F_1214(1,77,768);onnx_3A__3A_MatMul_5F_2579.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1216(1,77,768)
Add_467:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1216(1,77,768)*output:onnx_3A__3A_Add_5F_1217(1,77,768)
Add_468:Add*input:input_2E_47(1,77,768);onnx_3A__3A_Add_5F_1217(1,77,768)*output:input_2E_51(1,77,768)
ReduceMean_469:ReduceMean*input:input_2E_51(1,77,768)*output:onnx_3A__3A_Sub_5F_1219(1,77,1)*axes:-1
Sub_470:Sub*input:input_2E_51(1,77,768);onnx_3A__3A_Sub_5F_1219(1,77,1)*output:onnx_3A__3A_Pow_5F_1220(1,77,768)
Pow_472:Pow*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1222(1,77,768)
ReduceMean_473:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1222(1,77,768)*output:onnx_3A__3A_Add_5F_1223(1,77,1)*axes:-1
Add_475:Add*input:onnx_3A__3A_Add_5F_1223(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1225(1,77,1)
Sqrt_476:Sqrt*input:onnx_3A__3A_Sqrt_5F_1225(1,77,1)*output:onnx_3A__3A_Div_5F_1226(1,77,1)
Div_477:Div*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Div_5F_1226(1,77,1)*output:onnx_3A__3A_Mul_5F_1227(1,77,768)
Mul_478:Mul*input:onnx_3A__3A_Mul_5F_1227(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1228(1,77,768)
Add_479:Add*input:onnx_3A__3A_Add_5F_1228(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1229(1,77,768)
MatMul_480:MatMul*input:onnx_3A__3A_MatMul_5F_1229(1,77,768);onnx_3A__3A_MatMul_5F_2580.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1231(1,77,3072)
Add_481:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1231(1,77,3072)*output:onnx_3A__3A_Mul_5F_1232(1,77,3072)
Mul_483:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072)
Sigmoid_484:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072)*output:onnx_3A__3A_Mul_5F_1235(1,77,3072)
Mul_485:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_1235(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1236(1,77,3072)
MatMul_486:MatMul*input:onnx_3A__3A_MatMul_5F_1236(1,77,3072);onnx_3A__3A_MatMul_5F_2581.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1238(1,77,768)
Add_487:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1238(1,77,768)*output:onnx_3A__3A_Add_5F_1239(1,77,768)
Add_488:Add*input:input_2E_51(1,77,768);onnx_3A__3A_Add_5F_1239(1,77,768)*output:input_2E_55(1,77,768)
ReduceMean_489:ReduceMean*input:input_2E_55(1,77,768)*output:onnx_3A__3A_Sub_5F_1241(1,77,1)*axes:-1
Sub_490:Sub*input:input_2E_55(1,77,768);onnx_3A__3A_Sub_5F_1241(1,77,1)*output:onnx_3A__3A_Pow_5F_1242(1,77,768)
Pow_492:Pow*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1244(1,77,768)
ReduceMean_493:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1244(1,77,768)*output:onnx_3A__3A_Add_5F_1245(1,77,1)*axes:-1
Add_495:Add*input:onnx_3A__3A_Add_5F_1245(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1247(1,77,1)
Sqrt_496:Sqrt*input:onnx_3A__3A_Sqrt_5F_1247(1,77,1)*output:onnx_3A__3A_Div_5F_1248(1,77,1)
Div_497:Div*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Div_5F_1248(1,77,1)*output:onnx_3A__3A_Mul_5F_1249(1,77,768)
Mul_498:Mul*input:onnx_3A__3A_Mul_5F_1249(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1250(1,77,768)
Add_499:Add*input:onnx_3A__3A_Add_5F_1250(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1251(1,77,768)
MatMul_500:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2582.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1256(1,77,768)
Add_501:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1256(1,77,768)*output:onnx_3A__3A_Mul_5F_1257(1,77,768)
Mul_503:Mul*input:onnx_3A__3A_Mul_5F_1257(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_23(1,77,768)
MatMul_504:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2583.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1261(1,77,768)
Add_505:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1261(1,77,768)*output:onnx_3A__3A_Reshape_5F_1262(1,77,768)
Reshape_506:Reshape*input:onnx_3A__3A_Reshape_5F_1262(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*allowzero:0
Transpose_507:Transpose*input:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1276(1,12,77,64)*perm:0,2,1,3
MatMul_508:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2589.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1278(1,77,768)
Add_509:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1278(1,77,768)*output:onnx_3A__3A_Reshape_5F_1279(1,77,768)
Reshape_510:Reshape*input:onnx_3A__3A_Reshape_5F_1279(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*allowzero:0
Transpose_511:Transpose*input:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1293(1,12,77,64)*perm:0,2,1,3
Reshape_512:Reshape*input:query_5F_states_2E_23(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*allowzero:0
Transpose_513:Transpose*input:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1307(1,12,77,64)*perm:0,2,1,3
Reshape_514:Reshape*input:onnx_3A__3A_Reshape_5F_1307(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1317(12,77,64)*allowzero:0
Reshape_515:Reshape*input:onnx_3A__3A_Reshape_5F_1276(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1327(12,77,64)*allowzero:0
Reshape_516:Reshape*input:onnx_3A__3A_Reshape_5F_1293(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1337(12,77,64)*allowzero:0
Transpose_517:Transpose*input:onnx_3A__3A_Transpose_5F_1327(12,77,64)*output:onnx_3A__3A_MatMul_5F_1339(12,64,77)*perm:0,2,1
MatMul_518:MatMul*input:onnx_3A__3A_MatMul_5F_1317(12,77,64);onnx_3A__3A_MatMul_5F_1339(12,64,77)*output:onnx_3A__3A_Reshape_5F_1340(12,77,77)
Reshape_519:Reshape*input:onnx_3A__3A_Reshape_5F_1340(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1351(1,12,77,77)*allowzero:0
Add_520:Add*input:onnx_3A__3A_Add_5F_1351(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1352(1,12,77,77)
Reshape_521:Reshape*input:onnx_3A__3A_Reshape_5F_1352(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_47(12,77,77)*allowzero:0
Softmax_522:Softmax*input:attn_5F_weights_2E_47(12,77,77)*output:attn_5F_weights_2E_51(12,77,77)*axis:-1
MatMul_523:MatMul*input:attn_5F_weights_2E_51(12,77,77);onnx_3A__3A_MatMul_5F_1337(12,77,64)*output:onnx_3A__3A_Reshape_5F_1363(12,77,64)
Reshape_524:Reshape*input:onnx_3A__3A_Reshape_5F_1363(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*allowzero:0
Transpose_525:Transpose*input:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1376(1,77,12,64)*perm:0,2,1,3
Reshape_526:Reshape*input:onnx_3A__3A_Reshape_5F_1376(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1384(1,77,768)*allowzero:0
MatMul_527:MatMul*input:onnx_3A__3A_MatMul_5F_1384(1,77,768);onnx_3A__3A_MatMul_5F_2630.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1386(1,77,768)
Add_528:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1386(1,77,768)*output:onnx_3A__3A_Add_5F_1387(1,77,768)
Add_529:Add*input:input_2E_55(1,77,768);onnx_3A__3A_Add_5F_1387(1,77,768)*output:input_2E_59(1,77,768)
ReduceMean_530:ReduceMean*input:input_2E_59(1,77,768)*output:onnx_3A__3A_Sub_5F_1389(1,77,1)*axes:-1
Sub_531:Sub*input:input_2E_59(1,77,768);onnx_3A__3A_Sub_5F_1389(1,77,1)*output:onnx_3A__3A_Pow_5F_1390(1,77,768)
Pow_533:Pow*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1392(1,77,768)
ReduceMean_534:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1392(1,77,768)*output:onnx_3A__3A_Add_5F_1393(1,77,1)*axes:-1
Add_536:Add*input:onnx_3A__3A_Add_5F_1393(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1395(1,77,1)
Sqrt_537:Sqrt*input:onnx_3A__3A_Sqrt_5F_1395(1,77,1)*output:onnx_3A__3A_Div_5F_1396(1,77,1)
Div_538:Div*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Div_5F_1396(1,77,1)*output:onnx_3A__3A_Mul_5F_1397(1,77,768)
Mul_539:Mul*input:onnx_3A__3A_Mul_5F_1397(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1398(1,77,768)
Add_540:Add*input:onnx_3A__3A_Add_5F_1398(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1399(1,77,768)
MatMul_541:MatMul*input:onnx_3A__3A_MatMul_5F_1399(1,77,768);onnx_3A__3A_MatMul_5F_2631.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1401(1,77,3072)
Add_542:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1401(1,77,3072)*output:onnx_3A__3A_Mul_5F_1402(1,77,3072)
Mul_544:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072)
Sigmoid_545:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072)*output:onnx_3A__3A_Mul_5F_1405(1,77,3072)
Mul_546:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_1405(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1406(1,77,3072)
MatMul_547:MatMul*input:onnx_3A__3A_MatMul_5F_1406(1,77,3072);onnx_3A__3A_MatMul_5F_2632.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1408(1,77,768)
Add_548:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1408(1,77,768)*output:onnx_3A__3A_Add_5F_1409(1,77,768)
Add_549:Add*input:input_2E_59(1,77,768);onnx_3A__3A_Add_5F_1409(1,77,768)*output:input_2E_63(1,77,768)
ReduceMean_550:ReduceMean*input:input_2E_63(1,77,768)*output:onnx_3A__3A_Sub_5F_1411(1,77,1)*axes:-1
Sub_551:Sub*input:input_2E_63(1,77,768);onnx_3A__3A_Sub_5F_1411(1,77,1)*output:onnx_3A__3A_Pow_5F_1412(1,77,768)
Pow_553:Pow*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1414(1,77,768)
ReduceMean_554:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1414(1,77,768)*output:onnx_3A__3A_Add_5F_1415(1,77,1)*axes:-1
Add_556:Add*input:onnx_3A__3A_Add_5F_1415(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1417(1,77,1)
Sqrt_557:Sqrt*input:onnx_3A__3A_Sqrt_5F_1417(1,77,1)*output:onnx_3A__3A_Div_5F_1418(1,77,1)
Div_558:Div*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Div_5F_1418(1,77,1)*output:onnx_3A__3A_Mul_5F_1419(1,77,768)
Mul_559:Mul*input:onnx_3A__3A_Mul_5F_1419(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1420(1,77,768)
Add_560:Add*input:onnx_3A__3A_Add_5F_1420(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1421(1,77,768)
MatMul_561:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2633.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1426(1,77,768)
Add_562:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1426(1,77,768)*output:onnx_3A__3A_Mul_5F_1427(1,77,768)
Mul_564:Mul*input:onnx_3A__3A_Mul_5F_1427(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_27(1,77,768)
MatMul_565:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2634.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1431(1,77,768)
Add_566:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1431(1,77,768)*output:onnx_3A__3A_Reshape_5F_1432(1,77,768)
Reshape_567:Reshape*input:onnx_3A__3A_Reshape_5F_1432(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*allowzero:0
Transpose_568:Transpose*input:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1446(1,12,77,64)*perm:0,2,1,3
MatMul_569:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2640.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1448(1,77,768)
Add_570:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1448(1,77,768)*output:onnx_3A__3A_Reshape_5F_1449(1,77,768)
Reshape_571:Reshape*input:onnx_3A__3A_Reshape_5F_1449(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*allowzero:0
Transpose_572:Transpose*input:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1463(1,12,77,64)*perm:0,2,1,3
Reshape_573:Reshape*input:query_5F_states_2E_27(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*allowzero:0
Transpose_574:Transpose*input:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1477(1,12,77,64)*perm:0,2,1,3
Reshape_575:Reshape*input:onnx_3A__3A_Reshape_5F_1477(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1487(12,77,64)*allowzero:0
Reshape_576:Reshape*input:onnx_3A__3A_Reshape_5F_1446(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1497(12,77,64)*allowzero:0
Reshape_577:Reshape*input:onnx_3A__3A_Reshape_5F_1463(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1507(12,77,64)*allowzero:0
Transpose_578:Transpose*input:onnx_3A__3A_Transpose_5F_1497(12,77,64)*output:onnx_3A__3A_MatMul_5F_1509(12,64,77)*perm:0,2,1
MatMul_579:MatMul*input:onnx_3A__3A_MatMul_5F_1487(12,77,64);onnx_3A__3A_MatMul_5F_1509(12,64,77)*output:onnx_3A__3A_Reshape_5F_1510(12,77,77)
Reshape_580:Reshape*input:onnx_3A__3A_Reshape_5F_1510(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1521(1,12,77,77)*allowzero:0
Add_581:Add*input:onnx_3A__3A_Add_5F_1521(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1522(1,12,77,77)
Reshape_582:Reshape*input:onnx_3A__3A_Reshape_5F_1522(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_55(12,77,77)*allowzero:0
Softmax_583:Softmax*input:attn_5F_weights_2E_55(12,77,77)*output:attn_5F_weights_2E_59(12,77,77)*axis:-1
MatMul_584:MatMul*input:attn_5F_weights_2E_59(12,77,77);onnx_3A__3A_MatMul_5F_1507(12,77,64)*output:onnx_3A__3A_Reshape_5F_1533(12,77,64)
Reshape_585:Reshape*input:onnx_3A__3A_Reshape_5F_1533(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*allowzero:0
Transpose_586:Transpose*input:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1546(1,77,12,64)*perm:0,2,1,3
Reshape_587:Reshape*input:onnx_3A__3A_Reshape_5F_1546(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1554(1,77,768)*allowzero:0
MatMul_588:MatMul*input:onnx_3A__3A_MatMul_5F_1554(1,77,768);onnx_3A__3A_MatMul_5F_2681.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1556(1,77,768)
Add_589:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1556(1,77,768)*output:onnx_3A__3A_Add_5F_1557(1,77,768)
Add_590:Add*input:input_2E_63(1,77,768);onnx_3A__3A_Add_5F_1557(1,77,768)*output:input_2E_67(1,77,768)
ReduceMean_591:ReduceMean*input:input_2E_67(1,77,768)*output:onnx_3A__3A_Sub_5F_1559(1,77,1)*axes:-1
Sub_592:Sub*input:input_2E_67(1,77,768);onnx_3A__3A_Sub_5F_1559(1,77,1)*output:onnx_3A__3A_Pow_5F_1560(1,77,768)
Pow_594:Pow*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1562(1,77,768)
ReduceMean_595:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1562(1,77,768)*output:onnx_3A__3A_Add_5F_1563(1,77,1)*axes:-1
Add_597:Add*input:onnx_3A__3A_Add_5F_1563(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1565(1,77,1)
Sqrt_598:Sqrt*input:onnx_3A__3A_Sqrt_5F_1565(1,77,1)*output:onnx_3A__3A_Div_5F_1566(1,77,1)
Div_599:Div*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Div_5F_1566(1,77,1)*output:onnx_3A__3A_Mul_5F_1567(1,77,768)
Mul_600:Mul*input:onnx_3A__3A_Mul_5F_1567(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1568(1,77,768)
Add_601:Add*input:onnx_3A__3A_Add_5F_1568(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1569(1,77,768)
MatMul_602:MatMul*input:onnx_3A__3A_MatMul_5F_1569(1,77,768);onnx_3A__3A_MatMul_5F_2682.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1571(1,77,3072)
Add_603:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1571(1,77,3072)*output:onnx_3A__3A_Mul_5F_1572(1,77,3072)
Mul_605:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072)
Sigmoid_606:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072)*output:onnx_3A__3A_Mul_5F_1575(1,77,3072)
Mul_607:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_1575(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1576(1,77,3072)
MatMul_608:MatMul*input:onnx_3A__3A_MatMul_5F_1576(1,77,3072);onnx_3A__3A_MatMul_5F_2683.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1578(1,77,768)
Add_609:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1578(1,77,768)*output:onnx_3A__3A_Add_5F_1579(1,77,768)
Add_610:Add*input:input_2E_67(1,77,768);onnx_3A__3A_Add_5F_1579(1,77,768)*output:input_2E_71(1,77,768)
ReduceMean_611:ReduceMean*input:input_2E_71(1,77,768)*output:onnx_3A__3A_Sub_5F_1581(1,77,1)*axes:-1
Sub_612:Sub*input:input_2E_71(1,77,768);onnx_3A__3A_Sub_5F_1581(1,77,1)*output:onnx_3A__3A_Pow_5F_1582(1,77,768)
Pow_614:Pow*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1584(1,77,768)
ReduceMean_615:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1584(1,77,768)*output:onnx_3A__3A_Add_5F_1585(1,77,1)*axes:-1
Add_617:Add*input:onnx_3A__3A_Add_5F_1585(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1587(1,77,1)
Sqrt_618:Sqrt*input:onnx_3A__3A_Sqrt_5F_1587(1,77,1)*output:onnx_3A__3A_Div_5F_1588(1,77,1)
Div_619:Div*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Div_5F_1588(1,77,1)*output:onnx_3A__3A_Mul_5F_1589(1,77,768)
Mul_620:Mul*input:onnx_3A__3A_Mul_5F_1589(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1590(1,77,768)
Add_621:Add*input:onnx_3A__3A_Add_5F_1590(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1591(1,77,768)
MatMul_622:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2684.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1596(1,77,768)
Add_623:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1596(1,77,768)*output:onnx_3A__3A_Mul_5F_1597(1,77,768)
Mul_625:Mul*input:onnx_3A__3A_Mul_5F_1597(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_31(1,77,768)
MatMul_626:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2685.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1601(1,77,768)
Add_627:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1601(1,77,768)*output:onnx_3A__3A_Reshape_5F_1602(1,77,768)
Reshape_628:Reshape*input:onnx_3A__3A_Reshape_5F_1602(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*allowzero:0
Transpose_629:Transpose*input:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1616(1,12,77,64)*perm:0,2,1,3
MatMul_630:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2691.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1618(1,77,768)
Add_631:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1618(1,77,768)*output:onnx_3A__3A_Reshape_5F_1619(1,77,768)
Reshape_632:Reshape*input:onnx_3A__3A_Reshape_5F_1619(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*allowzero:0
Transpose_633:Transpose*input:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1633(1,12,77,64)*perm:0,2,1,3
Reshape_634:Reshape*input:query_5F_states_2E_31(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*allowzero:0
Transpose_635:Transpose*input:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1647(1,12,77,64)*perm:0,2,1,3
Reshape_636:Reshape*input:onnx_3A__3A_Reshape_5F_1647(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1657(12,77,64)*allowzero:0
Reshape_637:Reshape*input:onnx_3A__3A_Reshape_5F_1616(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1667(12,77,64)*allowzero:0
Reshape_638:Reshape*input:onnx_3A__3A_Reshape_5F_1633(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1677(12,77,64)*allowzero:0
Transpose_639:Transpose*input:onnx_3A__3A_Transpose_5F_1667(12,77,64)*output:onnx_3A__3A_MatMul_5F_1679(12,64,77)*perm:0,2,1
MatMul_640:MatMul*input:onnx_3A__3A_MatMul_5F_1657(12,77,64);onnx_3A__3A_MatMul_5F_1679(12,64,77)*output:onnx_3A__3A_Reshape_5F_1680(12,77,77)
Reshape_641:Reshape*input:onnx_3A__3A_Reshape_5F_1680(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1691(1,12,77,77)*allowzero:0
Add_642:Add*input:onnx_3A__3A_Add_5F_1691(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1692(1,12,77,77)
Reshape_643:Reshape*input:onnx_3A__3A_Reshape_5F_1692(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_63(12,77,77)*allowzero:0
Softmax_644:Softmax*input:attn_5F_weights_2E_63(12,77,77)*output:attn_5F_weights_2E_67(12,77,77)*axis:-1
MatMul_645:MatMul*input:attn_5F_weights_2E_67(12,77,77);onnx_3A__3A_MatMul_5F_1677(12,77,64)*output:onnx_3A__3A_Reshape_5F_1703(12,77,64)
Reshape_646:Reshape*input:onnx_3A__3A_Reshape_5F_1703(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*allowzero:0
Transpose_647:Transpose*input:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1716(1,77,12,64)*perm:0,2,1,3
Reshape_648:Reshape*input:onnx_3A__3A_Reshape_5F_1716(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1724(1,77,768)*allowzero:0
MatMul_649:MatMul*input:onnx_3A__3A_MatMul_5F_1724(1,77,768);onnx_3A__3A_MatMul_5F_2732.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1726(1,77,768)
Add_650:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1726(1,77,768)*output:onnx_3A__3A_Add_5F_1727(1,77,768)
Add_651:Add*input:input_2E_71(1,77,768);onnx_3A__3A_Add_5F_1727(1,77,768)*output:input_2E_75(1,77,768)
ReduceMean_652:ReduceMean*input:input_2E_75(1,77,768)*output:onnx_3A__3A_Sub_5F_1729(1,77,1)*axes:-1
Sub_653:Sub*input:input_2E_75(1,77,768);onnx_3A__3A_Sub_5F_1729(1,77,1)*output:onnx_3A__3A_Pow_5F_1730(1,77,768)
Pow_655:Pow*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1732(1,77,768)
ReduceMean_656:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1732(1,77,768)*output:onnx_3A__3A_Add_5F_1733(1,77,1)*axes:-1
Add_658:Add*input:onnx_3A__3A_Add_5F_1733(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1735(1,77,1)
Sqrt_659:Sqrt*input:onnx_3A__3A_Sqrt_5F_1735(1,77,1)*output:onnx_3A__3A_Div_5F_1736(1,77,1)
Div_660:Div*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Div_5F_1736(1,77,1)*output:onnx_3A__3A_Mul_5F_1737(1,77,768)
Mul_661:Mul*input:onnx_3A__3A_Mul_5F_1737(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1738(1,77,768)
Add_662:Add*input:onnx_3A__3A_Add_5F_1738(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1739(1,77,768)
MatMul_663:MatMul*input:onnx_3A__3A_MatMul_5F_1739(1,77,768);onnx_3A__3A_MatMul_5F_2733.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1741(1,77,3072)
Add_664:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1741(1,77,3072)*output:onnx_3A__3A_Mul_5F_1742(1,77,3072)
Mul_666:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072)
Sigmoid_667:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072)*output:onnx_3A__3A_Mul_5F_1745(1,77,3072)
Mul_668:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_1745(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1746(1,77,3072)
MatMul_669:MatMul*input:onnx_3A__3A_MatMul_5F_1746(1,77,3072);onnx_3A__3A_MatMul_5F_2734.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1748(1,77,768)
Add_670:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1748(1,77,768)*output:onnx_3A__3A_Add_5F_1749(1,77,768)
Add_671:Add*input:input_2E_75(1,77,768);onnx_3A__3A_Add_5F_1749(1,77,768)*output:input_2E_79(1,77,768)
ReduceMean_672:ReduceMean*input:input_2E_79(1,77,768)*output:onnx_3A__3A_Sub_5F_1751(1,77,1)*axes:-1
Sub_673:Sub*input:input_2E_79(1,77,768);onnx_3A__3A_Sub_5F_1751(1,77,1)*output:onnx_3A__3A_Pow_5F_1752(1,77,768)
Pow_675:Pow*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1754(1,77,768)
ReduceMean_676:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1754(1,77,768)*output:onnx_3A__3A_Add_5F_1755(1,77,1)*axes:-1
Add_678:Add*input:onnx_3A__3A_Add_5F_1755(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1757(1,77,1)
Sqrt_679:Sqrt*input:onnx_3A__3A_Sqrt_5F_1757(1,77,1)*output:onnx_3A__3A_Div_5F_1758(1,77,1)
Div_680:Div*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Div_5F_1758(1,77,1)*output:onnx_3A__3A_Mul_5F_1759(1,77,768)
Mul_681:Mul*input:onnx_3A__3A_Mul_5F_1759(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1760(1,77,768)
Add_682:Add*input:onnx_3A__3A_Add_5F_1760(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1761(1,77,768)
MatMul_683:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2735.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1766(1,77,768)
Add_684:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1766(1,77,768)*output:onnx_3A__3A_Mul_5F_1767(1,77,768)
Mul_686:Mul*input:onnx_3A__3A_Mul_5F_1767(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_35(1,77,768)
MatMul_687:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2736.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1771(1,77,768)
Add_688:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1771(1,77,768)*output:onnx_3A__3A_Reshape_5F_1772(1,77,768)
Reshape_689:Reshape*input:onnx_3A__3A_Reshape_5F_1772(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*allowzero:0
Transpose_690:Transpose*input:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1786(1,12,77,64)*perm:0,2,1,3
MatMul_691:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2742.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1788(1,77,768)
Add_692:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1788(1,77,768)*output:onnx_3A__3A_Reshape_5F_1789(1,77,768)
Reshape_693:Reshape*input:onnx_3A__3A_Reshape_5F_1789(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*allowzero:0
Transpose_694:Transpose*input:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1803(1,12,77,64)*perm:0,2,1,3
Reshape_695:Reshape*input:query_5F_states_2E_35(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*allowzero:0
Transpose_696:Transpose*input:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1817(1,12,77,64)*perm:0,2,1,3
Reshape_697:Reshape*input:onnx_3A__3A_Reshape_5F_1817(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1827(12,77,64)*allowzero:0
Reshape_698:Reshape*input:onnx_3A__3A_Reshape_5F_1786(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1837(12,77,64)*allowzero:0
Reshape_699:Reshape*input:onnx_3A__3A_Reshape_5F_1803(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1847(12,77,64)*allowzero:0
Transpose_700:Transpose*input:onnx_3A__3A_Transpose_5F_1837(12,77,64)*output:onnx_3A__3A_MatMul_5F_1849(12,64,77)*perm:0,2,1
MatMul_701:MatMul*input:onnx_3A__3A_MatMul_5F_1827(12,77,64);onnx_3A__3A_MatMul_5F_1849(12,64,77)*output:onnx_3A__3A_Reshape_5F_1850(12,77,77)
Reshape_702:Reshape*input:onnx_3A__3A_Reshape_5F_1850(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1861(1,12,77,77)*allowzero:0
Add_703:Add*input:onnx_3A__3A_Add_5F_1861(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1862(1,12,77,77)
Reshape_704:Reshape*input:onnx_3A__3A_Reshape_5F_1862(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_71(12,77,77)*allowzero:0
Softmax_705:Softmax*input:attn_5F_weights_2E_71(12,77,77)*output:attn_5F_weights_2E_75(12,77,77)*axis:-1
MatMul_706:MatMul*input:attn_5F_weights_2E_75(12,77,77);onnx_3A__3A_MatMul_5F_1847(12,77,64)*output:onnx_3A__3A_Reshape_5F_1873(12,77,64)
Reshape_707:Reshape*input:onnx_3A__3A_Reshape_5F_1873(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*allowzero:0
Transpose_708:Transpose*input:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1886(1,77,12,64)*perm:0,2,1,3
Reshape_709:Reshape*input:onnx_3A__3A_Reshape_5F_1886(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1894(1,77,768)*allowzero:0
MatMul_710:MatMul*input:onnx_3A__3A_MatMul_5F_1894(1,77,768);onnx_3A__3A_MatMul_5F_2783.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1896(1,77,768)
Add_711:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1896(1,77,768)*output:onnx_3A__3A_Add_5F_1897(1,77,768)
Add_712:Add*input:input_2E_79(1,77,768);onnx_3A__3A_Add_5F_1897(1,77,768)*output:input_2E_83(1,77,768)
ReduceMean_713:ReduceMean*input:input_2E_83(1,77,768)*output:onnx_3A__3A_Sub_5F_1899(1,77,1)*axes:-1
Sub_714:Sub*input:input_2E_83(1,77,768);onnx_3A__3A_Sub_5F_1899(1,77,1)*output:onnx_3A__3A_Pow_5F_1900(1,77,768)
Pow_716:Pow*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1902(1,77,768)
ReduceMean_717:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1902(1,77,768)*output:onnx_3A__3A_Add_5F_1903(1,77,1)*axes:-1
Add_719:Add*input:onnx_3A__3A_Add_5F_1903(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1905(1,77,1)
Sqrt_720:Sqrt*input:onnx_3A__3A_Sqrt_5F_1905(1,77,1)*output:onnx_3A__3A_Div_5F_1906(1,77,1)
Div_721:Div*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Div_5F_1906(1,77,1)*output:onnx_3A__3A_Mul_5F_1907(1,77,768)
Mul_722:Mul*input:onnx_3A__3A_Mul_5F_1907(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1908(1,77,768)
Add_723:Add*input:onnx_3A__3A_Add_5F_1908(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1909(1,77,768)
MatMul_724:MatMul*input:onnx_3A__3A_MatMul_5F_1909(1,77,768);onnx_3A__3A_MatMul_5F_2784.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1911(1,77,3072)
Add_725:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1911(1,77,3072)*output:onnx_3A__3A_Mul_5F_1912(1,77,3072)
Mul_727:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072)
Sigmoid_728:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072)*output:onnx_3A__3A_Mul_5F_1915(1,77,3072)
Mul_729:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_1915(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1916(1,77,3072)
MatMul_730:MatMul*input:onnx_3A__3A_MatMul_5F_1916(1,77,3072);onnx_3A__3A_MatMul_5F_2785.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1918(1,77,768)
Add_731:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1918(1,77,768)*output:onnx_3A__3A_Add_5F_1919(1,77,768)
Add_732:Add*input:input_2E_83(1,77,768);onnx_3A__3A_Add_5F_1919(1,77,768)*output:input_2E_87(1,77,768)
ReduceMean_733:ReduceMean*input:input_2E_87(1,77,768)*output:onnx_3A__3A_Sub_5F_1921(1,77,1)*axes:-1
Sub_734:Sub*input:input_2E_87(1,77,768);onnx_3A__3A_Sub_5F_1921(1,77,1)*output:onnx_3A__3A_Pow_5F_1922(1,77,768)
Pow_736:Pow*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1924(1,77,768)
ReduceMean_737:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1924(1,77,768)*output:onnx_3A__3A_Add_5F_1925(1,77,1)*axes:-1
Add_739:Add*input:onnx_3A__3A_Add_5F_1925(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1927(1,77,1)
Sqrt_740:Sqrt*input:onnx_3A__3A_Sqrt_5F_1927(1,77,1)*output:onnx_3A__3A_Div_5F_1928(1,77,1)
Div_741:Div*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Div_5F_1928(1,77,1)*output:onnx_3A__3A_Mul_5F_1929(1,77,768)
Mul_742:Mul*input:onnx_3A__3A_Mul_5F_1929(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1930(1,77,768)
Add_743:Add*input:onnx_3A__3A_Add_5F_1930(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1931(1,77,768)
MatMul_744:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2786.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1936(1,77,768)
Add_745:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1936(1,77,768)*output:onnx_3A__3A_Mul_5F_1937(1,77,768)
Mul_747:Mul*input:onnx_3A__3A_Mul_5F_1937(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_39(1,77,768)
MatMul_748:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2787.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1941(1,77,768)
Add_749:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1941(1,77,768)*output:onnx_3A__3A_Reshape_5F_1942(1,77,768)
Reshape_750:Reshape*input:onnx_3A__3A_Reshape_5F_1942(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*allowzero:0
Transpose_751:Transpose*input:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1956(1,12,77,64)*perm:0,2,1,3
MatMul_752:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2793.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1958(1,77,768)
Add_753:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1958(1,77,768)*output:onnx_3A__3A_Reshape_5F_1959(1,77,768)
Reshape_754:Reshape*input:onnx_3A__3A_Reshape_5F_1959(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*allowzero:0
Transpose_755:Transpose*input:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1973(1,12,77,64)*perm:0,2,1,3
Reshape_756:Reshape*input:query_5F_states_2E_39(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*allowzero:0
Transpose_757:Transpose*input:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1987(1,12,77,64)*perm:0,2,1,3
Reshape_758:Reshape*input:onnx_3A__3A_Reshape_5F_1987(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1997(12,77,64)*allowzero:0
Reshape_759:Reshape*input:onnx_3A__3A_Reshape_5F_1956(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2007(12,77,64)*allowzero:0
Reshape_760:Reshape*input:onnx_3A__3A_Reshape_5F_1973(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2017(12,77,64)*allowzero:0
Transpose_761:Transpose*input:onnx_3A__3A_Transpose_5F_2007(12,77,64)*output:onnx_3A__3A_MatMul_5F_2019(12,64,77)*perm:0,2,1
MatMul_762:MatMul*input:onnx_3A__3A_MatMul_5F_1997(12,77,64);onnx_3A__3A_MatMul_5F_2019(12,64,77)*output:onnx_3A__3A_Reshape_5F_2020(12,77,77)
Reshape_763:Reshape*input:onnx_3A__3A_Reshape_5F_2020(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2031(1,12,77,77)*allowzero:0
Add_764:Add*input:onnx_3A__3A_Add_5F_2031(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2032(1,12,77,77)
Reshape_765:Reshape*input:onnx_3A__3A_Reshape_5F_2032(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_79(12,77,77)*allowzero:0
Softmax_766:Softmax*input:attn_5F_weights_2E_79(12,77,77)*output:attn_5F_weights_2E_83(12,77,77)*axis:-1
MatMul_767:MatMul*input:attn_5F_weights_2E_83(12,77,77);onnx_3A__3A_MatMul_5F_2017(12,77,64)*output:onnx_3A__3A_Reshape_5F_2043(12,77,64)
Reshape_768:Reshape*input:onnx_3A__3A_Reshape_5F_2043(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*allowzero:0
Transpose_769:Transpose*input:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2056(1,77,12,64)*perm:0,2,1,3
Reshape_770:Reshape*input:onnx_3A__3A_Reshape_5F_2056(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2064(1,77,768)*allowzero:0
MatMul_771:MatMul*input:onnx_3A__3A_MatMul_5F_2064(1,77,768);onnx_3A__3A_MatMul_5F_2834.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2066(1,77,768)
Add_772:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2066(1,77,768)*output:onnx_3A__3A_Add_5F_2067(1,77,768)
Add_773:Add*input:input_2E_87(1,77,768);onnx_3A__3A_Add_5F_2067(1,77,768)*output:input_2E_91(1,77,768)
ReduceMean_774:ReduceMean*input:input_2E_91(1,77,768)*output:onnx_3A__3A_Sub_5F_2069(1,77,1)*axes:-1
Sub_775:Sub*input:input_2E_91(1,77,768);onnx_3A__3A_Sub_5F_2069(1,77,1)*output:onnx_3A__3A_Pow_5F_2070(1,77,768)
Pow_777:Pow*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2072(1,77,768)
ReduceMean_778:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2072(1,77,768)*output:onnx_3A__3A_Add_5F_2073(1,77,1)*axes:-1
Add_780:Add*input:onnx_3A__3A_Add_5F_2073(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2075(1,77,1)
Sqrt_781:Sqrt*input:onnx_3A__3A_Sqrt_5F_2075(1,77,1)*output:onnx_3A__3A_Div_5F_2076(1,77,1)
Div_782:Div*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Div_5F_2076(1,77,1)*output:onnx_3A__3A_Mul_5F_2077(1,77,768)
Mul_783:Mul*input:onnx_3A__3A_Mul_5F_2077(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2078(1,77,768)
Add_784:Add*input:onnx_3A__3A_Add_5F_2078(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2079(1,77,768)
MatMul_785:MatMul*input:onnx_3A__3A_MatMul_5F_2079(1,77,768);onnx_3A__3A_MatMul_5F_2835.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2081(1,77,3072)
Add_786:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2081(1,77,3072)*output:onnx_3A__3A_Mul_5F_2082(1,77,3072)
Mul_788:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072)
Sigmoid_789:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072)*output:onnx_3A__3A_Mul_5F_2085(1,77,3072)
Mul_790:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_2085(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2086(1,77,3072)
MatMul_791:MatMul*input:onnx_3A__3A_MatMul_5F_2086(1,77,3072);onnx_3A__3A_MatMul_5F_2836.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2088(1,77,768)
Add_792:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2088(1,77,768)*output:onnx_3A__3A_Add_5F_2089(1,77,768)
Add_793:Add*input:input_2E_91(1,77,768);onnx_3A__3A_Add_5F_2089(1,77,768)*output:input_2E_95(1,77,768)
ReduceMean_794:ReduceMean*input:input_2E_95(1,77,768)*output:onnx_3A__3A_Sub_5F_2091(1,77,1)*axes:-1
Sub_795:Sub*input:input_2E_95(1,77,768);onnx_3A__3A_Sub_5F_2091(1,77,1)*output:onnx_3A__3A_Pow_5F_2092(1,77,768)
Pow_797:Pow*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2094(1,77,768)
ReduceMean_798:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2094(1,77,768)*output:onnx_3A__3A_Add_5F_2095(1,77,1)*axes:-1
Add_800:Add*input:onnx_3A__3A_Add_5F_2095(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2097(1,77,1)
Sqrt_801:Sqrt*input:onnx_3A__3A_Sqrt_5F_2097(1,77,1)*output:onnx_3A__3A_Div_5F_2098(1,77,1)
Div_802:Div*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Div_5F_2098(1,77,1)*output:onnx_3A__3A_Mul_5F_2099(1,77,768)
Mul_803:Mul*input:onnx_3A__3A_Mul_5F_2099(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2100(1,77,768)
Add_804:Add*input:onnx_3A__3A_Add_5F_2100(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2101(1,77,768)
MatMul_805:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2837.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2106(1,77,768)
Add_806:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2106(1,77,768)*output:onnx_3A__3A_Mul_5F_2107(1,77,768)
Mul_808:Mul*input:onnx_3A__3A_Mul_5F_2107(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_43(1,77,768)
MatMul_809:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2838.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2111(1,77,768)
Add_810:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2111(1,77,768)*output:onnx_3A__3A_Reshape_5F_2112(1,77,768)
Reshape_811:Reshape*input:onnx_3A__3A_Reshape_5F_2112(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*allowzero:0
Transpose_812:Transpose*input:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2126(1,12,77,64)*perm:0,2,1,3
MatMul_813:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2844.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2128(1,77,768)
Add_814:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2128(1,77,768)*output:onnx_3A__3A_Reshape_5F_2129(1,77,768)
Reshape_815:Reshape*input:onnx_3A__3A_Reshape_5F_2129(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*allowzero:0
Transpose_816:Transpose*input:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2143(1,12,77,64)*perm:0,2,1,3
Reshape_817:Reshape*input:query_5F_states_2E_43(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*allowzero:0
Transpose_818:Transpose*input:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2157(1,12,77,64)*perm:0,2,1,3
Reshape_819:Reshape*input:onnx_3A__3A_Reshape_5F_2157(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2167(12,77,64)*allowzero:0
Reshape_820:Reshape*input:onnx_3A__3A_Reshape_5F_2126(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2177(12,77,64)*allowzero:0
Reshape_821:Reshape*input:onnx_3A__3A_Reshape_5F_2143(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2187(12,77,64)*allowzero:0
Transpose_822:Transpose*input:onnx_3A__3A_Transpose_5F_2177(12,77,64)*output:onnx_3A__3A_MatMul_5F_2189(12,64,77)*perm:0,2,1
MatMul_823:MatMul*input:onnx_3A__3A_MatMul_5F_2167(12,77,64);onnx_3A__3A_MatMul_5F_2189(12,64,77)*output:onnx_3A__3A_Reshape_5F_2190(12,77,77)
Reshape_824:Reshape*input:onnx_3A__3A_Reshape_5F_2190(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2201(1,12,77,77)*allowzero:0
Add_825:Add*input:onnx_3A__3A_Add_5F_2201(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2202(1,12,77,77)
Reshape_826:Reshape*input:onnx_3A__3A_Reshape_5F_2202(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_87(12,77,77)*allowzero:0
Softmax_827:Softmax*input:attn_5F_weights_2E_87(12,77,77)*output:attn_5F_weights_2E_91(12,77,77)*axis:-1
MatMul_828:MatMul*input:attn_5F_weights_2E_91(12,77,77);onnx_3A__3A_MatMul_5F_2187(12,77,64)*output:onnx_3A__3A_Reshape_5F_2213(12,77,64)
Reshape_829:Reshape*input:onnx_3A__3A_Reshape_5F_2213(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*allowzero:0
Transpose_830:Transpose*input:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2226(1,77,12,64)*perm:0,2,1,3
Reshape_831:Reshape*input:onnx_3A__3A_Reshape_5F_2226(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2234(1,77,768)*allowzero:0
MatMul_832:MatMul*input:onnx_3A__3A_MatMul_5F_2234(1,77,768);onnx_3A__3A_MatMul_5F_2885.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2236(1,77,768)
Add_833:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2236(1,77,768)*output:onnx_3A__3A_Add_5F_2237(1,77,768)
Add_834:Add*input:input_2E_95(1,77,768);onnx_3A__3A_Add_5F_2237(1,77,768)*output:input_2E_99(1,77,768)
ReduceMean_835:ReduceMean*input:input_2E_99(1,77,768)*output:onnx_3A__3A_Sub_5F_2239(1,77,1)*axes:-1
Sub_836:Sub*input:input_2E_99(1,77,768);onnx_3A__3A_Sub_5F_2239(1,77,1)*output:onnx_3A__3A_Pow_5F_2240(1,77,768)
Pow_838:Pow*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2242(1,77,768)
ReduceMean_839:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2242(1,77,768)*output:onnx_3A__3A_Add_5F_2243(1,77,1)*axes:-1
Add_841:Add*input:onnx_3A__3A_Add_5F_2243(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2245(1,77,1)
Sqrt_842:Sqrt*input:onnx_3A__3A_Sqrt_5F_2245(1,77,1)*output:onnx_3A__3A_Div_5F_2246(1,77,1)
Div_843:Div*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Div_5F_2246(1,77,1)*output:onnx_3A__3A_Mul_5F_2247(1,77,768)
Mul_844:Mul*input:onnx_3A__3A_Mul_5F_2247(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2248(1,77,768)
Add_845:Add*input:onnx_3A__3A_Add_5F_2248(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2249(1,77,768)
MatMul_846:MatMul*input:onnx_3A__3A_MatMul_5F_2249(1,77,768);onnx_3A__3A_MatMul_5F_2886.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2251(1,77,3072)
Add_847:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2251(1,77,3072)*output:onnx_3A__3A_Mul_5F_2252(1,77,3072)
Mul_849:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072)
Sigmoid_850:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072)*output:onnx_3A__3A_Mul_5F_2255(1,77,3072)
Mul_851:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_2255(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2256(1,77,3072)
MatMul_852:MatMul*input:onnx_3A__3A_MatMul_5F_2256(1,77,3072);onnx_3A__3A_MatMul_5F_2887.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2258(1,77,768)
Add_853:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2258(1,77,768)*output:onnx_3A__3A_Add_5F_2259(1,77,768)
Add_854:Add*input:input_2E_99(1,77,768);onnx_3A__3A_Add_5F_2259(1,77,768)*output:input_2E_103(1,77,768)
ReduceMean_855:ReduceMean*input:input_2E_103(1,77,768)*output:onnx_3A__3A_Sub_5F_2261(1,77,1)*axes:-1
Sub_856:Sub*input:input_2E_103(1,77,768);onnx_3A__3A_Sub_5F_2261(1,77,1)*output:onnx_3A__3A_Pow_5F_2262(1,77,768)
Pow_858:Pow*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2264(1,77,768)
ReduceMean_859:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2264(1,77,768)*output:onnx_3A__3A_Add_5F_2265(1,77,1)*axes:-1
Add_861:Add*input:onnx_3A__3A_Add_5F_2265(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2267(1,77,1)
Sqrt_862:Sqrt*input:onnx_3A__3A_Sqrt_5F_2267(1,77,1)*output:onnx_3A__3A_Div_5F_2268(1,77,1)
Div_863:Div*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Div_5F_2268(1,77,1)*output:onnx_3A__3A_Mul_5F_2269(1,77,768)
Mul_864:Mul*input:onnx_3A__3A_Mul_5F_2269(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2270(1,77,768)
Add_865:Add*input:onnx_3A__3A_Add_5F_2270(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_bias.bin(float32:768)*output:2271(1,77,768)