diff --git "a/text_encoder_fp32/model.txt" "b/text_encoder_fp32/model.txt" --- "a/text_encoder_fp32/model.txt" +++ "b/text_encoder_fp32/model.txt" @@ -1,672 +1,672 @@ -Reshape_113:Reshape*input:onnx_3A__3A_Reshape_5F_0(1,77);onnx_3A__3A_Reshape_5F_2274.bin(int64:2)*output:input(1,77)*allowzero:0 -Gather_114:Gather*input:text_5F_model_2E_embeddings_2E_token_5F_embedding_2E_wrapped_2E_weight.bin(float32:49408,768);input(1,77)*output:onnx_3A__3A_Add_5F_212(1,77,768) -Add_116:Add*input:onnx_3A__3A_Add_5F_212(1,77,768);onnx_3A__3A_Add_5F_213.bin(float32:1,77,768)*output:input_2E_7(1,77,768) -ReduceMean_123:ReduceMean*input:input_2E_7(1,77,768)*output:onnx_3A__3A_Sub_5F_221(1,77,1)*axes:-1 -Sub_124:Sub*input:input_2E_7(1,77,768);onnx_3A__3A_Sub_5F_221(1,77,1)*output:onnx_3A__3A_Pow_5F_222(1,77,768) -Pow_126:Pow*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_224(1,77,768) -ReduceMean_127:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_224(1,77,768)*output:onnx_3A__3A_Add_5F_225(1,77,1)*axes:-1 -Add_129:Add*input:onnx_3A__3A_Add_5F_225(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_227(1,77,1) -Sqrt_130:Sqrt*input:onnx_3A__3A_Sqrt_5F_227(1,77,1)*output:onnx_3A__3A_Div_5F_228(1,77,1) -Div_131:Div*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Div_5F_228(1,77,1)*output:onnx_3A__3A_Mul_5F_229(1,77,768) -Mul_132:Mul*input:onnx_3A__3A_Mul_5F_229(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_230(1,77,768) -Add_133:Add*input:onnx_3A__3A_Add_5F_230(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_231(1,77,768) -MatMul_134:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2276.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_236(1,77,768) -Add_135:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_236(1,77,768)*output:onnx_3A__3A_Mul_5F_237(1,77,768) -Mul_137:Mul*input:onnx_3A__3A_Mul_5F_237(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states(1,77,768) -MatMul_138:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2277.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_241(1,77,768) -Add_139:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_241(1,77,768)*output:onnx_3A__3A_Reshape_5F_242(1,77,768) -Reshape_140:Reshape*input:onnx_3A__3A_Reshape_5F_242(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*allowzero:0 -Transpose_141:Transpose*input:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_256(1,12,77,64)*perm:0,2,1,3 -MatMul_142:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2283.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_258(1,77,768) -Add_143:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_258(1,77,768)*output:onnx_3A__3A_Reshape_5F_259(1,77,768) -Reshape_144:Reshape*input:onnx_3A__3A_Reshape_5F_259(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*allowzero:0 -Transpose_145:Transpose*input:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_273(1,12,77,64)*perm:0,2,1,3 -Reshape_146:Reshape*input:query_5F_states(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*allowzero:0 -Transpose_147:Transpose*input:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_287(1,12,77,64)*perm:0,2,1,3 -Reshape_148:Reshape*input:onnx_3A__3A_Reshape_5F_287(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_297(12,77,64)*allowzero:0 -Reshape_149:Reshape*input:onnx_3A__3A_Reshape_5F_256(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_307(12,77,64)*allowzero:0 -Reshape_150:Reshape*input:onnx_3A__3A_Reshape_5F_273(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_317(12,77,64)*allowzero:0 -Transpose_151:Transpose*input:onnx_3A__3A_Transpose_5F_307(12,77,64)*output:onnx_3A__3A_MatMul_5F_319(12,64,77)*perm:0,2,1 -MatMul_152:MatMul*input:onnx_3A__3A_MatMul_5F_297(12,77,64);onnx_3A__3A_MatMul_5F_319(12,64,77)*output:onnx_3A__3A_Reshape_5F_320(12,77,77) -Reshape_153:Reshape*input:onnx_3A__3A_Reshape_5F_320(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_331(1,12,77,77)*allowzero:0 -Add_154:Add*input:onnx_3A__3A_Add_5F_331(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_332(1,12,77,77) -Reshape_155:Reshape*input:onnx_3A__3A_Reshape_5F_332(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights(12,77,77)*allowzero:0 -Softmax_156:Softmax*input:attn_5F_weights(12,77,77)*output:attn_5F_weights_2E_3(12,77,77)*axis:-1 -MatMul_157:MatMul*input:attn_5F_weights_2E_3(12,77,77);onnx_3A__3A_MatMul_5F_317(12,77,64)*output:onnx_3A__3A_Reshape_5F_343(12,77,64) -Reshape_158:Reshape*input:onnx_3A__3A_Reshape_5F_343(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*allowzero:0 -Transpose_159:Transpose*input:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_356(1,77,12,64)*perm:0,2,1,3 -Reshape_160:Reshape*input:onnx_3A__3A_Reshape_5F_356(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_364(1,77,768)*allowzero:0 -MatMul_161:MatMul*input:onnx_3A__3A_MatMul_5F_364(1,77,768);onnx_3A__3A_MatMul_5F_2324.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_366(1,77,768) -Add_162:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_366(1,77,768)*output:onnx_3A__3A_Add_5F_367(1,77,768) -Add_163:Add*input:input_2E_7(1,77,768);onnx_3A__3A_Add_5F_367(1,77,768)*output:input_2E_11(1,77,768) -ReduceMean_164:ReduceMean*input:input_2E_11(1,77,768)*output:onnx_3A__3A_Sub_5F_369(1,77,1)*axes:-1 -Sub_165:Sub*input:input_2E_11(1,77,768);onnx_3A__3A_Sub_5F_369(1,77,1)*output:onnx_3A__3A_Pow_5F_370(1,77,768) -Pow_167:Pow*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_372(1,77,768) -ReduceMean_168:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_372(1,77,768)*output:onnx_3A__3A_Add_5F_373(1,77,1)*axes:-1 -Add_170:Add*input:onnx_3A__3A_Add_5F_373(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_375(1,77,1) -Sqrt_171:Sqrt*input:onnx_3A__3A_Sqrt_5F_375(1,77,1)*output:onnx_3A__3A_Div_5F_376(1,77,1) -Div_172:Div*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Div_5F_376(1,77,1)*output:onnx_3A__3A_Mul_5F_377(1,77,768) -Mul_173:Mul*input:onnx_3A__3A_Mul_5F_377(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_378(1,77,768) -Add_174:Add*input:onnx_3A__3A_Add_5F_378(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_379(1,77,768) -MatMul_175:MatMul*input:onnx_3A__3A_MatMul_5F_379(1,77,768);onnx_3A__3A_MatMul_5F_2325.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_381(1,77,3072) -Add_176:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_381(1,77,3072)*output:onnx_3A__3A_Mul_5F_382(1,77,3072) -Mul_178:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_384(1,77,3072) -Sigmoid_179:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_384(1,77,3072)*output:onnx_3A__3A_Mul_5F_385(1,77,3072) -Mul_180:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_385(1,77,3072)*output:onnx_3A__3A_MatMul_5F_386(1,77,3072) -MatMul_181:MatMul*input:onnx_3A__3A_MatMul_5F_386(1,77,3072);onnx_3A__3A_MatMul_5F_2326.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_388(1,77,768) -Add_182:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_388(1,77,768)*output:onnx_3A__3A_Add_5F_389(1,77,768) -Add_183:Add*input:input_2E_11(1,77,768);onnx_3A__3A_Add_5F_389(1,77,768)*output:input_2E_15(1,77,768) -ReduceMean_184:ReduceMean*input:input_2E_15(1,77,768)*output:onnx_3A__3A_Sub_5F_391(1,77,1)*axes:-1 -Sub_185:Sub*input:input_2E_15(1,77,768);onnx_3A__3A_Sub_5F_391(1,77,1)*output:onnx_3A__3A_Pow_5F_392(1,77,768) -Pow_187:Pow*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_394(1,77,768) -ReduceMean_188:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_394(1,77,768)*output:onnx_3A__3A_Add_5F_395(1,77,1)*axes:-1 -Add_190:Add*input:onnx_3A__3A_Add_5F_395(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_397(1,77,1) -Sqrt_191:Sqrt*input:onnx_3A__3A_Sqrt_5F_397(1,77,1)*output:onnx_3A__3A_Div_5F_398(1,77,1) -Div_192:Div*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Div_5F_398(1,77,1)*output:onnx_3A__3A_Mul_5F_399(1,77,768) -Mul_193:Mul*input:onnx_3A__3A_Mul_5F_399(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_400(1,77,768) -Add_194:Add*input:onnx_3A__3A_Add_5F_400(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_401(1,77,768) -MatMul_195:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2327.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_406(1,77,768) -Add_196:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_406(1,77,768)*output:onnx_3A__3A_Mul_5F_407(1,77,768) -Mul_198:Mul*input:onnx_3A__3A_Mul_5F_407(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_3(1,77,768) -MatMul_199:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2328.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_411(1,77,768) -Add_200:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_411(1,77,768)*output:onnx_3A__3A_Reshape_5F_412(1,77,768) -Reshape_201:Reshape*input:onnx_3A__3A_Reshape_5F_412(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*allowzero:0 -Transpose_202:Transpose*input:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_426(1,12,77,64)*perm:0,2,1,3 -MatMul_203:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2334.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_428(1,77,768) -Add_204:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_428(1,77,768)*output:onnx_3A__3A_Reshape_5F_429(1,77,768) -Reshape_205:Reshape*input:onnx_3A__3A_Reshape_5F_429(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*allowzero:0 -Transpose_206:Transpose*input:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_443(1,12,77,64)*perm:0,2,1,3 -Reshape_207:Reshape*input:query_5F_states_2E_3(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*allowzero:0 -Transpose_208:Transpose*input:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_457(1,12,77,64)*perm:0,2,1,3 -Reshape_209:Reshape*input:onnx_3A__3A_Reshape_5F_457(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_467(12,77,64)*allowzero:0 -Reshape_210:Reshape*input:onnx_3A__3A_Reshape_5F_426(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_477(12,77,64)*allowzero:0 -Reshape_211:Reshape*input:onnx_3A__3A_Reshape_5F_443(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_487(12,77,64)*allowzero:0 -Transpose_212:Transpose*input:onnx_3A__3A_Transpose_5F_477(12,77,64)*output:onnx_3A__3A_MatMul_5F_489(12,64,77)*perm:0,2,1 -MatMul_213:MatMul*input:onnx_3A__3A_MatMul_5F_467(12,77,64);onnx_3A__3A_MatMul_5F_489(12,64,77)*output:onnx_3A__3A_Reshape_5F_490(12,77,77) -Reshape_214:Reshape*input:onnx_3A__3A_Reshape_5F_490(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_501(1,12,77,77)*allowzero:0 -Add_215:Add*input:onnx_3A__3A_Add_5F_501(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_502(1,12,77,77) -Reshape_216:Reshape*input:onnx_3A__3A_Reshape_5F_502(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_7(12,77,77)*allowzero:0 -Softmax_217:Softmax*input:attn_5F_weights_2E_7(12,77,77)*output:attn_5F_weights_2E_11(12,77,77)*axis:-1 -MatMul_218:MatMul*input:attn_5F_weights_2E_11(12,77,77);onnx_3A__3A_MatMul_5F_487(12,77,64)*output:onnx_3A__3A_Reshape_5F_513(12,77,64) -Reshape_219:Reshape*input:onnx_3A__3A_Reshape_5F_513(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*allowzero:0 -Transpose_220:Transpose*input:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_526(1,77,12,64)*perm:0,2,1,3 -Reshape_221:Reshape*input:onnx_3A__3A_Reshape_5F_526(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_534(1,77,768)*allowzero:0 -MatMul_222:MatMul*input:onnx_3A__3A_MatMul_5F_534(1,77,768);onnx_3A__3A_MatMul_5F_2375.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_536(1,77,768) -Add_223:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_536(1,77,768)*output:onnx_3A__3A_Add_5F_537(1,77,768) -Add_224:Add*input:input_2E_15(1,77,768);onnx_3A__3A_Add_5F_537(1,77,768)*output:input_2E_19(1,77,768) -ReduceMean_225:ReduceMean*input:input_2E_19(1,77,768)*output:onnx_3A__3A_Sub_5F_539(1,77,1)*axes:-1 -Sub_226:Sub*input:input_2E_19(1,77,768);onnx_3A__3A_Sub_5F_539(1,77,1)*output:onnx_3A__3A_Pow_5F_540(1,77,768) -Pow_228:Pow*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_542(1,77,768) -ReduceMean_229:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_542(1,77,768)*output:onnx_3A__3A_Add_5F_543(1,77,1)*axes:-1 -Add_231:Add*input:onnx_3A__3A_Add_5F_543(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_545(1,77,1) -Sqrt_232:Sqrt*input:onnx_3A__3A_Sqrt_5F_545(1,77,1)*output:onnx_3A__3A_Div_5F_546(1,77,1) -Div_233:Div*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Div_5F_546(1,77,1)*output:onnx_3A__3A_Mul_5F_547(1,77,768) -Mul_234:Mul*input:onnx_3A__3A_Mul_5F_547(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_548(1,77,768) -Add_235:Add*input:onnx_3A__3A_Add_5F_548(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_549(1,77,768) -MatMul_236:MatMul*input:onnx_3A__3A_MatMul_5F_549(1,77,768);onnx_3A__3A_MatMul_5F_2376.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_551(1,77,3072) -Add_237:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_551(1,77,3072)*output:onnx_3A__3A_Mul_5F_552(1,77,3072) -Mul_239:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_554(1,77,3072) -Sigmoid_240:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_554(1,77,3072)*output:onnx_3A__3A_Mul_5F_555(1,77,3072) -Mul_241:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_555(1,77,3072)*output:onnx_3A__3A_MatMul_5F_556(1,77,3072) -MatMul_242:MatMul*input:onnx_3A__3A_MatMul_5F_556(1,77,3072);onnx_3A__3A_MatMul_5F_2377.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_558(1,77,768) -Add_243:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_558(1,77,768)*output:onnx_3A__3A_Add_5F_559(1,77,768) -Add_244:Add*input:input_2E_19(1,77,768);onnx_3A__3A_Add_5F_559(1,77,768)*output:input_2E_23(1,77,768) -ReduceMean_245:ReduceMean*input:input_2E_23(1,77,768)*output:onnx_3A__3A_Sub_5F_561(1,77,1)*axes:-1 -Sub_246:Sub*input:input_2E_23(1,77,768);onnx_3A__3A_Sub_5F_561(1,77,1)*output:onnx_3A__3A_Pow_5F_562(1,77,768) -Pow_248:Pow*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_564(1,77,768) -ReduceMean_249:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_564(1,77,768)*output:onnx_3A__3A_Add_5F_565(1,77,1)*axes:-1 -Add_251:Add*input:onnx_3A__3A_Add_5F_565(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_567(1,77,1) -Sqrt_252:Sqrt*input:onnx_3A__3A_Sqrt_5F_567(1,77,1)*output:onnx_3A__3A_Div_5F_568(1,77,1) -Div_253:Div*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Div_5F_568(1,77,1)*output:onnx_3A__3A_Mul_5F_569(1,77,768) -Mul_254:Mul*input:onnx_3A__3A_Mul_5F_569(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_570(1,77,768) -Add_255:Add*input:onnx_3A__3A_Add_5F_570(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_571(1,77,768) -MatMul_256:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2378.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_576(1,77,768) -Add_257:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_576(1,77,768)*output:onnx_3A__3A_Mul_5F_577(1,77,768) -Mul_259:Mul*input:onnx_3A__3A_Mul_5F_577(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_7(1,77,768) -MatMul_260:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2379.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_581(1,77,768) -Add_261:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_581(1,77,768)*output:onnx_3A__3A_Reshape_5F_582(1,77,768) -Reshape_262:Reshape*input:onnx_3A__3A_Reshape_5F_582(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*allowzero:0 -Transpose_263:Transpose*input:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_596(1,12,77,64)*perm:0,2,1,3 -MatMul_264:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2385.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_598(1,77,768) -Add_265:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_598(1,77,768)*output:onnx_3A__3A_Reshape_5F_599(1,77,768) -Reshape_266:Reshape*input:onnx_3A__3A_Reshape_5F_599(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*allowzero:0 -Transpose_267:Transpose*input:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_613(1,12,77,64)*perm:0,2,1,3 -Reshape_268:Reshape*input:query_5F_states_2E_7(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*allowzero:0 -Transpose_269:Transpose*input:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_627(1,12,77,64)*perm:0,2,1,3 -Reshape_270:Reshape*input:onnx_3A__3A_Reshape_5F_627(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_637(12,77,64)*allowzero:0 -Reshape_271:Reshape*input:onnx_3A__3A_Reshape_5F_596(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_647(12,77,64)*allowzero:0 -Reshape_272:Reshape*input:onnx_3A__3A_Reshape_5F_613(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_657(12,77,64)*allowzero:0 -Transpose_273:Transpose*input:onnx_3A__3A_Transpose_5F_647(12,77,64)*output:onnx_3A__3A_MatMul_5F_659(12,64,77)*perm:0,2,1 -MatMul_274:MatMul*input:onnx_3A__3A_MatMul_5F_637(12,77,64);onnx_3A__3A_MatMul_5F_659(12,64,77)*output:onnx_3A__3A_Reshape_5F_660(12,77,77) -Reshape_275:Reshape*input:onnx_3A__3A_Reshape_5F_660(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_671(1,12,77,77)*allowzero:0 -Add_276:Add*input:onnx_3A__3A_Add_5F_671(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_672(1,12,77,77) -Reshape_277:Reshape*input:onnx_3A__3A_Reshape_5F_672(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_15(12,77,77)*allowzero:0 -Softmax_278:Softmax*input:attn_5F_weights_2E_15(12,77,77)*output:attn_5F_weights_2E_19(12,77,77)*axis:-1 -MatMul_279:MatMul*input:attn_5F_weights_2E_19(12,77,77);onnx_3A__3A_MatMul_5F_657(12,77,64)*output:onnx_3A__3A_Reshape_5F_683(12,77,64) -Reshape_280:Reshape*input:onnx_3A__3A_Reshape_5F_683(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*allowzero:0 -Transpose_281:Transpose*input:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_696(1,77,12,64)*perm:0,2,1,3 -Reshape_282:Reshape*input:onnx_3A__3A_Reshape_5F_696(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_704(1,77,768)*allowzero:0 -MatMul_283:MatMul*input:onnx_3A__3A_MatMul_5F_704(1,77,768);onnx_3A__3A_MatMul_5F_2426.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_706(1,77,768) -Add_284:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_706(1,77,768)*output:onnx_3A__3A_Add_5F_707(1,77,768) -Add_285:Add*input:input_2E_23(1,77,768);onnx_3A__3A_Add_5F_707(1,77,768)*output:input_2E_27(1,77,768) -ReduceMean_286:ReduceMean*input:input_2E_27(1,77,768)*output:onnx_3A__3A_Sub_5F_709(1,77,1)*axes:-1 -Sub_287:Sub*input:input_2E_27(1,77,768);onnx_3A__3A_Sub_5F_709(1,77,1)*output:onnx_3A__3A_Pow_5F_710(1,77,768) -Pow_289:Pow*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_712(1,77,768) -ReduceMean_290:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_712(1,77,768)*output:onnx_3A__3A_Add_5F_713(1,77,1)*axes:-1 -Add_292:Add*input:onnx_3A__3A_Add_5F_713(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_715(1,77,1) -Sqrt_293:Sqrt*input:onnx_3A__3A_Sqrt_5F_715(1,77,1)*output:onnx_3A__3A_Div_5F_716(1,77,1) -Div_294:Div*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Div_5F_716(1,77,1)*output:onnx_3A__3A_Mul_5F_717(1,77,768) -Mul_295:Mul*input:onnx_3A__3A_Mul_5F_717(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_718(1,77,768) -Add_296:Add*input:onnx_3A__3A_Add_5F_718(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_719(1,77,768) -MatMul_297:MatMul*input:onnx_3A__3A_MatMul_5F_719(1,77,768);onnx_3A__3A_MatMul_5F_2427.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_721(1,77,3072) -Add_298:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_721(1,77,3072)*output:onnx_3A__3A_Mul_5F_722(1,77,3072) -Mul_300:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_724(1,77,3072) -Sigmoid_301:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_724(1,77,3072)*output:onnx_3A__3A_Mul_5F_725(1,77,3072) -Mul_302:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_725(1,77,3072)*output:onnx_3A__3A_MatMul_5F_726(1,77,3072) -MatMul_303:MatMul*input:onnx_3A__3A_MatMul_5F_726(1,77,3072);onnx_3A__3A_MatMul_5F_2428.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_728(1,77,768) -Add_304:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_728(1,77,768)*output:onnx_3A__3A_Add_5F_729(1,77,768) -Add_305:Add*input:input_2E_27(1,77,768);onnx_3A__3A_Add_5F_729(1,77,768)*output:input_2E_31(1,77,768) -ReduceMean_306:ReduceMean*input:input_2E_31(1,77,768)*output:onnx_3A__3A_Sub_5F_731(1,77,1)*axes:-1 -Sub_307:Sub*input:input_2E_31(1,77,768);onnx_3A__3A_Sub_5F_731(1,77,1)*output:onnx_3A__3A_Pow_5F_732(1,77,768) -Pow_309:Pow*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_734(1,77,768) -ReduceMean_310:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_734(1,77,768)*output:onnx_3A__3A_Add_5F_735(1,77,1)*axes:-1 -Add_312:Add*input:onnx_3A__3A_Add_5F_735(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_737(1,77,1) -Sqrt_313:Sqrt*input:onnx_3A__3A_Sqrt_5F_737(1,77,1)*output:onnx_3A__3A_Div_5F_738(1,77,1) -Div_314:Div*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Div_5F_738(1,77,1)*output:onnx_3A__3A_Mul_5F_739(1,77,768) -Mul_315:Mul*input:onnx_3A__3A_Mul_5F_739(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_740(1,77,768) -Add_316:Add*input:onnx_3A__3A_Add_5F_740(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_741(1,77,768) -MatMul_317:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2429.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_746(1,77,768) -Add_318:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_746(1,77,768)*output:onnx_3A__3A_Mul_5F_747(1,77,768) -Mul_320:Mul*input:onnx_3A__3A_Mul_5F_747(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_11(1,77,768) -MatMul_321:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2430.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_751(1,77,768) -Add_322:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_751(1,77,768)*output:onnx_3A__3A_Reshape_5F_752(1,77,768) -Reshape_323:Reshape*input:onnx_3A__3A_Reshape_5F_752(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*allowzero:0 -Transpose_324:Transpose*input:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_766(1,12,77,64)*perm:0,2,1,3 -MatMul_325:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2436.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_768(1,77,768) -Add_326:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_768(1,77,768)*output:onnx_3A__3A_Reshape_5F_769(1,77,768) -Reshape_327:Reshape*input:onnx_3A__3A_Reshape_5F_769(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*allowzero:0 -Transpose_328:Transpose*input:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_783(1,12,77,64)*perm:0,2,1,3 -Reshape_329:Reshape*input:query_5F_states_2E_11(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*allowzero:0 -Transpose_330:Transpose*input:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_797(1,12,77,64)*perm:0,2,1,3 -Reshape_331:Reshape*input:onnx_3A__3A_Reshape_5F_797(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_807(12,77,64)*allowzero:0 -Reshape_332:Reshape*input:onnx_3A__3A_Reshape_5F_766(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_817(12,77,64)*allowzero:0 -Reshape_333:Reshape*input:onnx_3A__3A_Reshape_5F_783(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_827(12,77,64)*allowzero:0 -Transpose_334:Transpose*input:onnx_3A__3A_Transpose_5F_817(12,77,64)*output:onnx_3A__3A_MatMul_5F_829(12,64,77)*perm:0,2,1 -MatMul_335:MatMul*input:onnx_3A__3A_MatMul_5F_807(12,77,64);onnx_3A__3A_MatMul_5F_829(12,64,77)*output:onnx_3A__3A_Reshape_5F_830(12,77,77) -Reshape_336:Reshape*input:onnx_3A__3A_Reshape_5F_830(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_841(1,12,77,77)*allowzero:0 -Add_337:Add*input:onnx_3A__3A_Add_5F_841(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_842(1,12,77,77) -Reshape_338:Reshape*input:onnx_3A__3A_Reshape_5F_842(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_23(12,77,77)*allowzero:0 -Softmax_339:Softmax*input:attn_5F_weights_2E_23(12,77,77)*output:attn_5F_weights_2E_27(12,77,77)*axis:-1 -MatMul_340:MatMul*input:attn_5F_weights_2E_27(12,77,77);onnx_3A__3A_MatMul_5F_827(12,77,64)*output:onnx_3A__3A_Reshape_5F_853(12,77,64) -Reshape_341:Reshape*input:onnx_3A__3A_Reshape_5F_853(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*allowzero:0 -Transpose_342:Transpose*input:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_866(1,77,12,64)*perm:0,2,1,3 -Reshape_343:Reshape*input:onnx_3A__3A_Reshape_5F_866(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_874(1,77,768)*allowzero:0 -MatMul_344:MatMul*input:onnx_3A__3A_MatMul_5F_874(1,77,768);onnx_3A__3A_MatMul_5F_2477.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_876(1,77,768) -Add_345:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_876(1,77,768)*output:onnx_3A__3A_Add_5F_877(1,77,768) -Add_346:Add*input:input_2E_31(1,77,768);onnx_3A__3A_Add_5F_877(1,77,768)*output:input_2E_35(1,77,768) -ReduceMean_347:ReduceMean*input:input_2E_35(1,77,768)*output:onnx_3A__3A_Sub_5F_879(1,77,1)*axes:-1 -Sub_348:Sub*input:input_2E_35(1,77,768);onnx_3A__3A_Sub_5F_879(1,77,1)*output:onnx_3A__3A_Pow_5F_880(1,77,768) -Pow_350:Pow*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_882(1,77,768) -ReduceMean_351:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_882(1,77,768)*output:onnx_3A__3A_Add_5F_883(1,77,1)*axes:-1 -Add_353:Add*input:onnx_3A__3A_Add_5F_883(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_885(1,77,1) -Sqrt_354:Sqrt*input:onnx_3A__3A_Sqrt_5F_885(1,77,1)*output:onnx_3A__3A_Div_5F_886(1,77,1) -Div_355:Div*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Div_5F_886(1,77,1)*output:onnx_3A__3A_Mul_5F_887(1,77,768) -Mul_356:Mul*input:onnx_3A__3A_Mul_5F_887(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_888(1,77,768) -Add_357:Add*input:onnx_3A__3A_Add_5F_888(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_889(1,77,768) -MatMul_358:MatMul*input:onnx_3A__3A_MatMul_5F_889(1,77,768);onnx_3A__3A_MatMul_5F_2478.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_891(1,77,3072) -Add_359:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_891(1,77,3072)*output:onnx_3A__3A_Mul_5F_892(1,77,3072) -Mul_361:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_894(1,77,3072) -Sigmoid_362:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_894(1,77,3072)*output:onnx_3A__3A_Mul_5F_895(1,77,3072) -Mul_363:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_895(1,77,3072)*output:onnx_3A__3A_MatMul_5F_896(1,77,3072) -MatMul_364:MatMul*input:onnx_3A__3A_MatMul_5F_896(1,77,3072);onnx_3A__3A_MatMul_5F_2479.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_898(1,77,768) -Add_365:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_898(1,77,768)*output:onnx_3A__3A_Add_5F_899(1,77,768) -Add_366:Add*input:input_2E_35(1,77,768);onnx_3A__3A_Add_5F_899(1,77,768)*output:input_2E_39(1,77,768) -ReduceMean_367:ReduceMean*input:input_2E_39(1,77,768)*output:onnx_3A__3A_Sub_5F_901(1,77,1)*axes:-1 -Sub_368:Sub*input:input_2E_39(1,77,768);onnx_3A__3A_Sub_5F_901(1,77,1)*output:onnx_3A__3A_Pow_5F_902(1,77,768) -Pow_370:Pow*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_904(1,77,768) -ReduceMean_371:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_904(1,77,768)*output:onnx_3A__3A_Add_5F_905(1,77,1)*axes:-1 -Add_373:Add*input:onnx_3A__3A_Add_5F_905(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_907(1,77,1) -Sqrt_374:Sqrt*input:onnx_3A__3A_Sqrt_5F_907(1,77,1)*output:onnx_3A__3A_Div_5F_908(1,77,1) -Div_375:Div*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Div_5F_908(1,77,1)*output:onnx_3A__3A_Mul_5F_909(1,77,768) -Mul_376:Mul*input:onnx_3A__3A_Mul_5F_909(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_910(1,77,768) -Add_377:Add*input:onnx_3A__3A_Add_5F_910(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_911(1,77,768) -MatMul_378:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2480.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_916(1,77,768) -Add_379:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_916(1,77,768)*output:onnx_3A__3A_Mul_5F_917(1,77,768) -Mul_381:Mul*input:onnx_3A__3A_Mul_5F_917(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_15(1,77,768) -MatMul_382:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2481.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_921(1,77,768) -Add_383:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_921(1,77,768)*output:onnx_3A__3A_Reshape_5F_922(1,77,768) -Reshape_384:Reshape*input:onnx_3A__3A_Reshape_5F_922(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*allowzero:0 -Transpose_385:Transpose*input:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_936(1,12,77,64)*perm:0,2,1,3 -MatMul_386:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2487.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_938(1,77,768) -Add_387:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_938(1,77,768)*output:onnx_3A__3A_Reshape_5F_939(1,77,768) -Reshape_388:Reshape*input:onnx_3A__3A_Reshape_5F_939(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*allowzero:0 -Transpose_389:Transpose*input:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_953(1,12,77,64)*perm:0,2,1,3 -Reshape_390:Reshape*input:query_5F_states_2E_15(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*allowzero:0 -Transpose_391:Transpose*input:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_967(1,12,77,64)*perm:0,2,1,3 -Reshape_392:Reshape*input:onnx_3A__3A_Reshape_5F_967(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_977(12,77,64)*allowzero:0 -Reshape_393:Reshape*input:onnx_3A__3A_Reshape_5F_936(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_987(12,77,64)*allowzero:0 -Reshape_394:Reshape*input:onnx_3A__3A_Reshape_5F_953(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_997(12,77,64)*allowzero:0 -Transpose_395:Transpose*input:onnx_3A__3A_Transpose_5F_987(12,77,64)*output:onnx_3A__3A_MatMul_5F_999(12,64,77)*perm:0,2,1 -MatMul_396:MatMul*input:onnx_3A__3A_MatMul_5F_977(12,77,64);onnx_3A__3A_MatMul_5F_999(12,64,77)*output:onnx_3A__3A_Reshape_5F_1000(12,77,77) -Reshape_397:Reshape*input:onnx_3A__3A_Reshape_5F_1000(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1011(1,12,77,77)*allowzero:0 -Add_398:Add*input:onnx_3A__3A_Add_5F_1011(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1012(1,12,77,77) -Reshape_399:Reshape*input:onnx_3A__3A_Reshape_5F_1012(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_31(12,77,77)*allowzero:0 -Softmax_400:Softmax*input:attn_5F_weights_2E_31(12,77,77)*output:attn_5F_weights_2E_35(12,77,77)*axis:-1 -MatMul_401:MatMul*input:attn_5F_weights_2E_35(12,77,77);onnx_3A__3A_MatMul_5F_997(12,77,64)*output:onnx_3A__3A_Reshape_5F_1023(12,77,64) -Reshape_402:Reshape*input:onnx_3A__3A_Reshape_5F_1023(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*allowzero:0 -Transpose_403:Transpose*input:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1036(1,77,12,64)*perm:0,2,1,3 -Reshape_404:Reshape*input:onnx_3A__3A_Reshape_5F_1036(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1044(1,77,768)*allowzero:0 -MatMul_405:MatMul*input:onnx_3A__3A_MatMul_5F_1044(1,77,768);onnx_3A__3A_MatMul_5F_2528.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1046(1,77,768) -Add_406:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1046(1,77,768)*output:onnx_3A__3A_Add_5F_1047(1,77,768) -Add_407:Add*input:input_2E_39(1,77,768);onnx_3A__3A_Add_5F_1047(1,77,768)*output:input_2E_43(1,77,768) -ReduceMean_408:ReduceMean*input:input_2E_43(1,77,768)*output:onnx_3A__3A_Sub_5F_1049(1,77,1)*axes:-1 -Sub_409:Sub*input:input_2E_43(1,77,768);onnx_3A__3A_Sub_5F_1049(1,77,1)*output:onnx_3A__3A_Pow_5F_1050(1,77,768) -Pow_411:Pow*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1052(1,77,768) -ReduceMean_412:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1052(1,77,768)*output:onnx_3A__3A_Add_5F_1053(1,77,1)*axes:-1 -Add_414:Add*input:onnx_3A__3A_Add_5F_1053(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1055(1,77,1) -Sqrt_415:Sqrt*input:onnx_3A__3A_Sqrt_5F_1055(1,77,1)*output:onnx_3A__3A_Div_5F_1056(1,77,1) -Div_416:Div*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Div_5F_1056(1,77,1)*output:onnx_3A__3A_Mul_5F_1057(1,77,768) -Mul_417:Mul*input:onnx_3A__3A_Mul_5F_1057(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1058(1,77,768) -Add_418:Add*input:onnx_3A__3A_Add_5F_1058(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1059(1,77,768) -MatMul_419:MatMul*input:onnx_3A__3A_MatMul_5F_1059(1,77,768);onnx_3A__3A_MatMul_5F_2529.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1061(1,77,3072) -Add_420:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1061(1,77,3072)*output:onnx_3A__3A_Mul_5F_1062(1,77,3072) -Mul_422:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072) -Sigmoid_423:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072)*output:onnx_3A__3A_Mul_5F_1065(1,77,3072) -Mul_424:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_1065(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1066(1,77,3072) -MatMul_425:MatMul*input:onnx_3A__3A_MatMul_5F_1066(1,77,3072);onnx_3A__3A_MatMul_5F_2530.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1068(1,77,768) -Add_426:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1068(1,77,768)*output:onnx_3A__3A_Add_5F_1069(1,77,768) -Add_427:Add*input:input_2E_43(1,77,768);onnx_3A__3A_Add_5F_1069(1,77,768)*output:input_2E_47(1,77,768) -ReduceMean_428:ReduceMean*input:input_2E_47(1,77,768)*output:onnx_3A__3A_Sub_5F_1071(1,77,1)*axes:-1 -Sub_429:Sub*input:input_2E_47(1,77,768);onnx_3A__3A_Sub_5F_1071(1,77,1)*output:onnx_3A__3A_Pow_5F_1072(1,77,768) -Pow_431:Pow*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1074(1,77,768) -ReduceMean_432:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1074(1,77,768)*output:onnx_3A__3A_Add_5F_1075(1,77,1)*axes:-1 -Add_434:Add*input:onnx_3A__3A_Add_5F_1075(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1077(1,77,1) -Sqrt_435:Sqrt*input:onnx_3A__3A_Sqrt_5F_1077(1,77,1)*output:onnx_3A__3A_Div_5F_1078(1,77,1) -Div_436:Div*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Div_5F_1078(1,77,1)*output:onnx_3A__3A_Mul_5F_1079(1,77,768) -Mul_437:Mul*input:onnx_3A__3A_Mul_5F_1079(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1080(1,77,768) -Add_438:Add*input:onnx_3A__3A_Add_5F_1080(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1081(1,77,768) -MatMul_439:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2531.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1086(1,77,768) -Add_440:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1086(1,77,768)*output:onnx_3A__3A_Mul_5F_1087(1,77,768) -Mul_442:Mul*input:onnx_3A__3A_Mul_5F_1087(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_19(1,77,768) -MatMul_443:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2532.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1091(1,77,768) -Add_444:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1091(1,77,768)*output:onnx_3A__3A_Reshape_5F_1092(1,77,768) -Reshape_445:Reshape*input:onnx_3A__3A_Reshape_5F_1092(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*allowzero:0 -Transpose_446:Transpose*input:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1106(1,12,77,64)*perm:0,2,1,3 -MatMul_447:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2538.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1108(1,77,768) -Add_448:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1108(1,77,768)*output:onnx_3A__3A_Reshape_5F_1109(1,77,768) -Reshape_449:Reshape*input:onnx_3A__3A_Reshape_5F_1109(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*allowzero:0 -Transpose_450:Transpose*input:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1123(1,12,77,64)*perm:0,2,1,3 -Reshape_451:Reshape*input:query_5F_states_2E_19(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*allowzero:0 -Transpose_452:Transpose*input:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1137(1,12,77,64)*perm:0,2,1,3 -Reshape_453:Reshape*input:onnx_3A__3A_Reshape_5F_1137(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1147(12,77,64)*allowzero:0 -Reshape_454:Reshape*input:onnx_3A__3A_Reshape_5F_1106(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1157(12,77,64)*allowzero:0 -Reshape_455:Reshape*input:onnx_3A__3A_Reshape_5F_1123(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1167(12,77,64)*allowzero:0 -Transpose_456:Transpose*input:onnx_3A__3A_Transpose_5F_1157(12,77,64)*output:onnx_3A__3A_MatMul_5F_1169(12,64,77)*perm:0,2,1 -MatMul_457:MatMul*input:onnx_3A__3A_MatMul_5F_1147(12,77,64);onnx_3A__3A_MatMul_5F_1169(12,64,77)*output:onnx_3A__3A_Reshape_5F_1170(12,77,77) -Reshape_458:Reshape*input:onnx_3A__3A_Reshape_5F_1170(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1181(1,12,77,77)*allowzero:0 -Add_459:Add*input:onnx_3A__3A_Add_5F_1181(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1182(1,12,77,77) -Reshape_460:Reshape*input:onnx_3A__3A_Reshape_5F_1182(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_39(12,77,77)*allowzero:0 -Softmax_461:Softmax*input:attn_5F_weights_2E_39(12,77,77)*output:attn_5F_weights_2E_43(12,77,77)*axis:-1 -MatMul_462:MatMul*input:attn_5F_weights_2E_43(12,77,77);onnx_3A__3A_MatMul_5F_1167(12,77,64)*output:onnx_3A__3A_Reshape_5F_1193(12,77,64) -Reshape_463:Reshape*input:onnx_3A__3A_Reshape_5F_1193(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*allowzero:0 -Transpose_464:Transpose*input:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1206(1,77,12,64)*perm:0,2,1,3 -Reshape_465:Reshape*input:onnx_3A__3A_Reshape_5F_1206(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1214(1,77,768)*allowzero:0 -MatMul_466:MatMul*input:onnx_3A__3A_MatMul_5F_1214(1,77,768);onnx_3A__3A_MatMul_5F_2579.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1216(1,77,768) -Add_467:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1216(1,77,768)*output:onnx_3A__3A_Add_5F_1217(1,77,768) -Add_468:Add*input:input_2E_47(1,77,768);onnx_3A__3A_Add_5F_1217(1,77,768)*output:input_2E_51(1,77,768) -ReduceMean_469:ReduceMean*input:input_2E_51(1,77,768)*output:onnx_3A__3A_Sub_5F_1219(1,77,1)*axes:-1 -Sub_470:Sub*input:input_2E_51(1,77,768);onnx_3A__3A_Sub_5F_1219(1,77,1)*output:onnx_3A__3A_Pow_5F_1220(1,77,768) -Pow_472:Pow*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1222(1,77,768) -ReduceMean_473:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1222(1,77,768)*output:onnx_3A__3A_Add_5F_1223(1,77,1)*axes:-1 -Add_475:Add*input:onnx_3A__3A_Add_5F_1223(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1225(1,77,1) -Sqrt_476:Sqrt*input:onnx_3A__3A_Sqrt_5F_1225(1,77,1)*output:onnx_3A__3A_Div_5F_1226(1,77,1) -Div_477:Div*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Div_5F_1226(1,77,1)*output:onnx_3A__3A_Mul_5F_1227(1,77,768) -Mul_478:Mul*input:onnx_3A__3A_Mul_5F_1227(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1228(1,77,768) -Add_479:Add*input:onnx_3A__3A_Add_5F_1228(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1229(1,77,768) -MatMul_480:MatMul*input:onnx_3A__3A_MatMul_5F_1229(1,77,768);onnx_3A__3A_MatMul_5F_2580.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1231(1,77,3072) -Add_481:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1231(1,77,3072)*output:onnx_3A__3A_Mul_5F_1232(1,77,3072) -Mul_483:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072) -Sigmoid_484:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072)*output:onnx_3A__3A_Mul_5F_1235(1,77,3072) -Mul_485:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_1235(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1236(1,77,3072) -MatMul_486:MatMul*input:onnx_3A__3A_MatMul_5F_1236(1,77,3072);onnx_3A__3A_MatMul_5F_2581.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1238(1,77,768) -Add_487:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1238(1,77,768)*output:onnx_3A__3A_Add_5F_1239(1,77,768) -Add_488:Add*input:input_2E_51(1,77,768);onnx_3A__3A_Add_5F_1239(1,77,768)*output:input_2E_55(1,77,768) -ReduceMean_489:ReduceMean*input:input_2E_55(1,77,768)*output:onnx_3A__3A_Sub_5F_1241(1,77,1)*axes:-1 -Sub_490:Sub*input:input_2E_55(1,77,768);onnx_3A__3A_Sub_5F_1241(1,77,1)*output:onnx_3A__3A_Pow_5F_1242(1,77,768) -Pow_492:Pow*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1244(1,77,768) -ReduceMean_493:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1244(1,77,768)*output:onnx_3A__3A_Add_5F_1245(1,77,1)*axes:-1 -Add_495:Add*input:onnx_3A__3A_Add_5F_1245(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1247(1,77,1) -Sqrt_496:Sqrt*input:onnx_3A__3A_Sqrt_5F_1247(1,77,1)*output:onnx_3A__3A_Div_5F_1248(1,77,1) -Div_497:Div*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Div_5F_1248(1,77,1)*output:onnx_3A__3A_Mul_5F_1249(1,77,768) -Mul_498:Mul*input:onnx_3A__3A_Mul_5F_1249(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1250(1,77,768) -Add_499:Add*input:onnx_3A__3A_Add_5F_1250(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1251(1,77,768) -MatMul_500:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2582.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1256(1,77,768) -Add_501:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1256(1,77,768)*output:onnx_3A__3A_Mul_5F_1257(1,77,768) -Mul_503:Mul*input:onnx_3A__3A_Mul_5F_1257(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_23(1,77,768) -MatMul_504:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2583.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1261(1,77,768) -Add_505:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1261(1,77,768)*output:onnx_3A__3A_Reshape_5F_1262(1,77,768) -Reshape_506:Reshape*input:onnx_3A__3A_Reshape_5F_1262(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*allowzero:0 -Transpose_507:Transpose*input:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1276(1,12,77,64)*perm:0,2,1,3 -MatMul_508:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2589.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1278(1,77,768) -Add_509:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1278(1,77,768)*output:onnx_3A__3A_Reshape_5F_1279(1,77,768) -Reshape_510:Reshape*input:onnx_3A__3A_Reshape_5F_1279(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*allowzero:0 -Transpose_511:Transpose*input:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1293(1,12,77,64)*perm:0,2,1,3 -Reshape_512:Reshape*input:query_5F_states_2E_23(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*allowzero:0 -Transpose_513:Transpose*input:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1307(1,12,77,64)*perm:0,2,1,3 -Reshape_514:Reshape*input:onnx_3A__3A_Reshape_5F_1307(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1317(12,77,64)*allowzero:0 -Reshape_515:Reshape*input:onnx_3A__3A_Reshape_5F_1276(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1327(12,77,64)*allowzero:0 -Reshape_516:Reshape*input:onnx_3A__3A_Reshape_5F_1293(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1337(12,77,64)*allowzero:0 -Transpose_517:Transpose*input:onnx_3A__3A_Transpose_5F_1327(12,77,64)*output:onnx_3A__3A_MatMul_5F_1339(12,64,77)*perm:0,2,1 -MatMul_518:MatMul*input:onnx_3A__3A_MatMul_5F_1317(12,77,64);onnx_3A__3A_MatMul_5F_1339(12,64,77)*output:onnx_3A__3A_Reshape_5F_1340(12,77,77) -Reshape_519:Reshape*input:onnx_3A__3A_Reshape_5F_1340(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1351(1,12,77,77)*allowzero:0 -Add_520:Add*input:onnx_3A__3A_Add_5F_1351(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1352(1,12,77,77) -Reshape_521:Reshape*input:onnx_3A__3A_Reshape_5F_1352(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_47(12,77,77)*allowzero:0 -Softmax_522:Softmax*input:attn_5F_weights_2E_47(12,77,77)*output:attn_5F_weights_2E_51(12,77,77)*axis:-1 -MatMul_523:MatMul*input:attn_5F_weights_2E_51(12,77,77);onnx_3A__3A_MatMul_5F_1337(12,77,64)*output:onnx_3A__3A_Reshape_5F_1363(12,77,64) -Reshape_524:Reshape*input:onnx_3A__3A_Reshape_5F_1363(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*allowzero:0 -Transpose_525:Transpose*input:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1376(1,77,12,64)*perm:0,2,1,3 -Reshape_526:Reshape*input:onnx_3A__3A_Reshape_5F_1376(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1384(1,77,768)*allowzero:0 -MatMul_527:MatMul*input:onnx_3A__3A_MatMul_5F_1384(1,77,768);onnx_3A__3A_MatMul_5F_2630.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1386(1,77,768) -Add_528:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1386(1,77,768)*output:onnx_3A__3A_Add_5F_1387(1,77,768) -Add_529:Add*input:input_2E_55(1,77,768);onnx_3A__3A_Add_5F_1387(1,77,768)*output:input_2E_59(1,77,768) -ReduceMean_530:ReduceMean*input:input_2E_59(1,77,768)*output:onnx_3A__3A_Sub_5F_1389(1,77,1)*axes:-1 -Sub_531:Sub*input:input_2E_59(1,77,768);onnx_3A__3A_Sub_5F_1389(1,77,1)*output:onnx_3A__3A_Pow_5F_1390(1,77,768) -Pow_533:Pow*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1392(1,77,768) -ReduceMean_534:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1392(1,77,768)*output:onnx_3A__3A_Add_5F_1393(1,77,1)*axes:-1 -Add_536:Add*input:onnx_3A__3A_Add_5F_1393(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1395(1,77,1) -Sqrt_537:Sqrt*input:onnx_3A__3A_Sqrt_5F_1395(1,77,1)*output:onnx_3A__3A_Div_5F_1396(1,77,1) -Div_538:Div*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Div_5F_1396(1,77,1)*output:onnx_3A__3A_Mul_5F_1397(1,77,768) -Mul_539:Mul*input:onnx_3A__3A_Mul_5F_1397(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1398(1,77,768) -Add_540:Add*input:onnx_3A__3A_Add_5F_1398(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1399(1,77,768) -MatMul_541:MatMul*input:onnx_3A__3A_MatMul_5F_1399(1,77,768);onnx_3A__3A_MatMul_5F_2631.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1401(1,77,3072) -Add_542:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1401(1,77,3072)*output:onnx_3A__3A_Mul_5F_1402(1,77,3072) -Mul_544:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072) -Sigmoid_545:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072)*output:onnx_3A__3A_Mul_5F_1405(1,77,3072) -Mul_546:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_1405(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1406(1,77,3072) -MatMul_547:MatMul*input:onnx_3A__3A_MatMul_5F_1406(1,77,3072);onnx_3A__3A_MatMul_5F_2632.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1408(1,77,768) -Add_548:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1408(1,77,768)*output:onnx_3A__3A_Add_5F_1409(1,77,768) -Add_549:Add*input:input_2E_59(1,77,768);onnx_3A__3A_Add_5F_1409(1,77,768)*output:input_2E_63(1,77,768) -ReduceMean_550:ReduceMean*input:input_2E_63(1,77,768)*output:onnx_3A__3A_Sub_5F_1411(1,77,1)*axes:-1 -Sub_551:Sub*input:input_2E_63(1,77,768);onnx_3A__3A_Sub_5F_1411(1,77,1)*output:onnx_3A__3A_Pow_5F_1412(1,77,768) -Pow_553:Pow*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1414(1,77,768) -ReduceMean_554:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1414(1,77,768)*output:onnx_3A__3A_Add_5F_1415(1,77,1)*axes:-1 -Add_556:Add*input:onnx_3A__3A_Add_5F_1415(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1417(1,77,1) -Sqrt_557:Sqrt*input:onnx_3A__3A_Sqrt_5F_1417(1,77,1)*output:onnx_3A__3A_Div_5F_1418(1,77,1) -Div_558:Div*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Div_5F_1418(1,77,1)*output:onnx_3A__3A_Mul_5F_1419(1,77,768) -Mul_559:Mul*input:onnx_3A__3A_Mul_5F_1419(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1420(1,77,768) -Add_560:Add*input:onnx_3A__3A_Add_5F_1420(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1421(1,77,768) -MatMul_561:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2633.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1426(1,77,768) -Add_562:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1426(1,77,768)*output:onnx_3A__3A_Mul_5F_1427(1,77,768) -Mul_564:Mul*input:onnx_3A__3A_Mul_5F_1427(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_27(1,77,768) -MatMul_565:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2634.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1431(1,77,768) -Add_566:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1431(1,77,768)*output:onnx_3A__3A_Reshape_5F_1432(1,77,768) -Reshape_567:Reshape*input:onnx_3A__3A_Reshape_5F_1432(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*allowzero:0 -Transpose_568:Transpose*input:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1446(1,12,77,64)*perm:0,2,1,3 -MatMul_569:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2640.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1448(1,77,768) -Add_570:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1448(1,77,768)*output:onnx_3A__3A_Reshape_5F_1449(1,77,768) -Reshape_571:Reshape*input:onnx_3A__3A_Reshape_5F_1449(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*allowzero:0 -Transpose_572:Transpose*input:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1463(1,12,77,64)*perm:0,2,1,3 -Reshape_573:Reshape*input:query_5F_states_2E_27(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*allowzero:0 -Transpose_574:Transpose*input:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1477(1,12,77,64)*perm:0,2,1,3 -Reshape_575:Reshape*input:onnx_3A__3A_Reshape_5F_1477(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1487(12,77,64)*allowzero:0 -Reshape_576:Reshape*input:onnx_3A__3A_Reshape_5F_1446(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1497(12,77,64)*allowzero:0 -Reshape_577:Reshape*input:onnx_3A__3A_Reshape_5F_1463(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1507(12,77,64)*allowzero:0 -Transpose_578:Transpose*input:onnx_3A__3A_Transpose_5F_1497(12,77,64)*output:onnx_3A__3A_MatMul_5F_1509(12,64,77)*perm:0,2,1 -MatMul_579:MatMul*input:onnx_3A__3A_MatMul_5F_1487(12,77,64);onnx_3A__3A_MatMul_5F_1509(12,64,77)*output:onnx_3A__3A_Reshape_5F_1510(12,77,77) -Reshape_580:Reshape*input:onnx_3A__3A_Reshape_5F_1510(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1521(1,12,77,77)*allowzero:0 -Add_581:Add*input:onnx_3A__3A_Add_5F_1521(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1522(1,12,77,77) -Reshape_582:Reshape*input:onnx_3A__3A_Reshape_5F_1522(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_55(12,77,77)*allowzero:0 -Softmax_583:Softmax*input:attn_5F_weights_2E_55(12,77,77)*output:attn_5F_weights_2E_59(12,77,77)*axis:-1 -MatMul_584:MatMul*input:attn_5F_weights_2E_59(12,77,77);onnx_3A__3A_MatMul_5F_1507(12,77,64)*output:onnx_3A__3A_Reshape_5F_1533(12,77,64) -Reshape_585:Reshape*input:onnx_3A__3A_Reshape_5F_1533(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*allowzero:0 -Transpose_586:Transpose*input:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1546(1,77,12,64)*perm:0,2,1,3 -Reshape_587:Reshape*input:onnx_3A__3A_Reshape_5F_1546(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1554(1,77,768)*allowzero:0 -MatMul_588:MatMul*input:onnx_3A__3A_MatMul_5F_1554(1,77,768);onnx_3A__3A_MatMul_5F_2681.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1556(1,77,768) -Add_589:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1556(1,77,768)*output:onnx_3A__3A_Add_5F_1557(1,77,768) -Add_590:Add*input:input_2E_63(1,77,768);onnx_3A__3A_Add_5F_1557(1,77,768)*output:input_2E_67(1,77,768) -ReduceMean_591:ReduceMean*input:input_2E_67(1,77,768)*output:onnx_3A__3A_Sub_5F_1559(1,77,1)*axes:-1 -Sub_592:Sub*input:input_2E_67(1,77,768);onnx_3A__3A_Sub_5F_1559(1,77,1)*output:onnx_3A__3A_Pow_5F_1560(1,77,768) -Pow_594:Pow*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1562(1,77,768) -ReduceMean_595:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1562(1,77,768)*output:onnx_3A__3A_Add_5F_1563(1,77,1)*axes:-1 -Add_597:Add*input:onnx_3A__3A_Add_5F_1563(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1565(1,77,1) -Sqrt_598:Sqrt*input:onnx_3A__3A_Sqrt_5F_1565(1,77,1)*output:onnx_3A__3A_Div_5F_1566(1,77,1) -Div_599:Div*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Div_5F_1566(1,77,1)*output:onnx_3A__3A_Mul_5F_1567(1,77,768) -Mul_600:Mul*input:onnx_3A__3A_Mul_5F_1567(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1568(1,77,768) -Add_601:Add*input:onnx_3A__3A_Add_5F_1568(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1569(1,77,768) -MatMul_602:MatMul*input:onnx_3A__3A_MatMul_5F_1569(1,77,768);onnx_3A__3A_MatMul_5F_2682.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1571(1,77,3072) -Add_603:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1571(1,77,3072)*output:onnx_3A__3A_Mul_5F_1572(1,77,3072) -Mul_605:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072) -Sigmoid_606:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072)*output:onnx_3A__3A_Mul_5F_1575(1,77,3072) -Mul_607:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_1575(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1576(1,77,3072) -MatMul_608:MatMul*input:onnx_3A__3A_MatMul_5F_1576(1,77,3072);onnx_3A__3A_MatMul_5F_2683.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1578(1,77,768) -Add_609:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1578(1,77,768)*output:onnx_3A__3A_Add_5F_1579(1,77,768) -Add_610:Add*input:input_2E_67(1,77,768);onnx_3A__3A_Add_5F_1579(1,77,768)*output:input_2E_71(1,77,768) -ReduceMean_611:ReduceMean*input:input_2E_71(1,77,768)*output:onnx_3A__3A_Sub_5F_1581(1,77,1)*axes:-1 -Sub_612:Sub*input:input_2E_71(1,77,768);onnx_3A__3A_Sub_5F_1581(1,77,1)*output:onnx_3A__3A_Pow_5F_1582(1,77,768) -Pow_614:Pow*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1584(1,77,768) -ReduceMean_615:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1584(1,77,768)*output:onnx_3A__3A_Add_5F_1585(1,77,1)*axes:-1 -Add_617:Add*input:onnx_3A__3A_Add_5F_1585(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1587(1,77,1) -Sqrt_618:Sqrt*input:onnx_3A__3A_Sqrt_5F_1587(1,77,1)*output:onnx_3A__3A_Div_5F_1588(1,77,1) -Div_619:Div*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Div_5F_1588(1,77,1)*output:onnx_3A__3A_Mul_5F_1589(1,77,768) -Mul_620:Mul*input:onnx_3A__3A_Mul_5F_1589(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1590(1,77,768) -Add_621:Add*input:onnx_3A__3A_Add_5F_1590(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1591(1,77,768) -MatMul_622:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2684.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1596(1,77,768) -Add_623:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1596(1,77,768)*output:onnx_3A__3A_Mul_5F_1597(1,77,768) -Mul_625:Mul*input:onnx_3A__3A_Mul_5F_1597(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_31(1,77,768) -MatMul_626:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2685.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1601(1,77,768) -Add_627:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1601(1,77,768)*output:onnx_3A__3A_Reshape_5F_1602(1,77,768) -Reshape_628:Reshape*input:onnx_3A__3A_Reshape_5F_1602(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*allowzero:0 -Transpose_629:Transpose*input:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1616(1,12,77,64)*perm:0,2,1,3 -MatMul_630:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2691.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1618(1,77,768) -Add_631:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1618(1,77,768)*output:onnx_3A__3A_Reshape_5F_1619(1,77,768) -Reshape_632:Reshape*input:onnx_3A__3A_Reshape_5F_1619(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*allowzero:0 -Transpose_633:Transpose*input:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1633(1,12,77,64)*perm:0,2,1,3 -Reshape_634:Reshape*input:query_5F_states_2E_31(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*allowzero:0 -Transpose_635:Transpose*input:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1647(1,12,77,64)*perm:0,2,1,3 -Reshape_636:Reshape*input:onnx_3A__3A_Reshape_5F_1647(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1657(12,77,64)*allowzero:0 -Reshape_637:Reshape*input:onnx_3A__3A_Reshape_5F_1616(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1667(12,77,64)*allowzero:0 -Reshape_638:Reshape*input:onnx_3A__3A_Reshape_5F_1633(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1677(12,77,64)*allowzero:0 -Transpose_639:Transpose*input:onnx_3A__3A_Transpose_5F_1667(12,77,64)*output:onnx_3A__3A_MatMul_5F_1679(12,64,77)*perm:0,2,1 -MatMul_640:MatMul*input:onnx_3A__3A_MatMul_5F_1657(12,77,64);onnx_3A__3A_MatMul_5F_1679(12,64,77)*output:onnx_3A__3A_Reshape_5F_1680(12,77,77) -Reshape_641:Reshape*input:onnx_3A__3A_Reshape_5F_1680(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1691(1,12,77,77)*allowzero:0 -Add_642:Add*input:onnx_3A__3A_Add_5F_1691(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1692(1,12,77,77) -Reshape_643:Reshape*input:onnx_3A__3A_Reshape_5F_1692(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_63(12,77,77)*allowzero:0 -Softmax_644:Softmax*input:attn_5F_weights_2E_63(12,77,77)*output:attn_5F_weights_2E_67(12,77,77)*axis:-1 -MatMul_645:MatMul*input:attn_5F_weights_2E_67(12,77,77);onnx_3A__3A_MatMul_5F_1677(12,77,64)*output:onnx_3A__3A_Reshape_5F_1703(12,77,64) -Reshape_646:Reshape*input:onnx_3A__3A_Reshape_5F_1703(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*allowzero:0 -Transpose_647:Transpose*input:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1716(1,77,12,64)*perm:0,2,1,3 -Reshape_648:Reshape*input:onnx_3A__3A_Reshape_5F_1716(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1724(1,77,768)*allowzero:0 -MatMul_649:MatMul*input:onnx_3A__3A_MatMul_5F_1724(1,77,768);onnx_3A__3A_MatMul_5F_2732.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1726(1,77,768) -Add_650:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1726(1,77,768)*output:onnx_3A__3A_Add_5F_1727(1,77,768) -Add_651:Add*input:input_2E_71(1,77,768);onnx_3A__3A_Add_5F_1727(1,77,768)*output:input_2E_75(1,77,768) -ReduceMean_652:ReduceMean*input:input_2E_75(1,77,768)*output:onnx_3A__3A_Sub_5F_1729(1,77,1)*axes:-1 -Sub_653:Sub*input:input_2E_75(1,77,768);onnx_3A__3A_Sub_5F_1729(1,77,1)*output:onnx_3A__3A_Pow_5F_1730(1,77,768) -Pow_655:Pow*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1732(1,77,768) -ReduceMean_656:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1732(1,77,768)*output:onnx_3A__3A_Add_5F_1733(1,77,1)*axes:-1 -Add_658:Add*input:onnx_3A__3A_Add_5F_1733(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1735(1,77,1) -Sqrt_659:Sqrt*input:onnx_3A__3A_Sqrt_5F_1735(1,77,1)*output:onnx_3A__3A_Div_5F_1736(1,77,1) -Div_660:Div*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Div_5F_1736(1,77,1)*output:onnx_3A__3A_Mul_5F_1737(1,77,768) -Mul_661:Mul*input:onnx_3A__3A_Mul_5F_1737(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1738(1,77,768) -Add_662:Add*input:onnx_3A__3A_Add_5F_1738(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1739(1,77,768) -MatMul_663:MatMul*input:onnx_3A__3A_MatMul_5F_1739(1,77,768);onnx_3A__3A_MatMul_5F_2733.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1741(1,77,3072) -Add_664:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1741(1,77,3072)*output:onnx_3A__3A_Mul_5F_1742(1,77,3072) -Mul_666:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072) -Sigmoid_667:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072)*output:onnx_3A__3A_Mul_5F_1745(1,77,3072) -Mul_668:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_1745(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1746(1,77,3072) -MatMul_669:MatMul*input:onnx_3A__3A_MatMul_5F_1746(1,77,3072);onnx_3A__3A_MatMul_5F_2734.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1748(1,77,768) -Add_670:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1748(1,77,768)*output:onnx_3A__3A_Add_5F_1749(1,77,768) -Add_671:Add*input:input_2E_75(1,77,768);onnx_3A__3A_Add_5F_1749(1,77,768)*output:input_2E_79(1,77,768) -ReduceMean_672:ReduceMean*input:input_2E_79(1,77,768)*output:onnx_3A__3A_Sub_5F_1751(1,77,1)*axes:-1 -Sub_673:Sub*input:input_2E_79(1,77,768);onnx_3A__3A_Sub_5F_1751(1,77,1)*output:onnx_3A__3A_Pow_5F_1752(1,77,768) -Pow_675:Pow*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1754(1,77,768) -ReduceMean_676:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1754(1,77,768)*output:onnx_3A__3A_Add_5F_1755(1,77,1)*axes:-1 -Add_678:Add*input:onnx_3A__3A_Add_5F_1755(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1757(1,77,1) -Sqrt_679:Sqrt*input:onnx_3A__3A_Sqrt_5F_1757(1,77,1)*output:onnx_3A__3A_Div_5F_1758(1,77,1) -Div_680:Div*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Div_5F_1758(1,77,1)*output:onnx_3A__3A_Mul_5F_1759(1,77,768) -Mul_681:Mul*input:onnx_3A__3A_Mul_5F_1759(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1760(1,77,768) -Add_682:Add*input:onnx_3A__3A_Add_5F_1760(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1761(1,77,768) -MatMul_683:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2735.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1766(1,77,768) -Add_684:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1766(1,77,768)*output:onnx_3A__3A_Mul_5F_1767(1,77,768) -Mul_686:Mul*input:onnx_3A__3A_Mul_5F_1767(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_35(1,77,768) -MatMul_687:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2736.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1771(1,77,768) -Add_688:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1771(1,77,768)*output:onnx_3A__3A_Reshape_5F_1772(1,77,768) -Reshape_689:Reshape*input:onnx_3A__3A_Reshape_5F_1772(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*allowzero:0 -Transpose_690:Transpose*input:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1786(1,12,77,64)*perm:0,2,1,3 -MatMul_691:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2742.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1788(1,77,768) -Add_692:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1788(1,77,768)*output:onnx_3A__3A_Reshape_5F_1789(1,77,768) -Reshape_693:Reshape*input:onnx_3A__3A_Reshape_5F_1789(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*allowzero:0 -Transpose_694:Transpose*input:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1803(1,12,77,64)*perm:0,2,1,3 -Reshape_695:Reshape*input:query_5F_states_2E_35(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*allowzero:0 -Transpose_696:Transpose*input:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1817(1,12,77,64)*perm:0,2,1,3 -Reshape_697:Reshape*input:onnx_3A__3A_Reshape_5F_1817(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1827(12,77,64)*allowzero:0 -Reshape_698:Reshape*input:onnx_3A__3A_Reshape_5F_1786(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1837(12,77,64)*allowzero:0 -Reshape_699:Reshape*input:onnx_3A__3A_Reshape_5F_1803(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1847(12,77,64)*allowzero:0 -Transpose_700:Transpose*input:onnx_3A__3A_Transpose_5F_1837(12,77,64)*output:onnx_3A__3A_MatMul_5F_1849(12,64,77)*perm:0,2,1 -MatMul_701:MatMul*input:onnx_3A__3A_MatMul_5F_1827(12,77,64);onnx_3A__3A_MatMul_5F_1849(12,64,77)*output:onnx_3A__3A_Reshape_5F_1850(12,77,77) -Reshape_702:Reshape*input:onnx_3A__3A_Reshape_5F_1850(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1861(1,12,77,77)*allowzero:0 -Add_703:Add*input:onnx_3A__3A_Add_5F_1861(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1862(1,12,77,77) -Reshape_704:Reshape*input:onnx_3A__3A_Reshape_5F_1862(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_71(12,77,77)*allowzero:0 -Softmax_705:Softmax*input:attn_5F_weights_2E_71(12,77,77)*output:attn_5F_weights_2E_75(12,77,77)*axis:-1 -MatMul_706:MatMul*input:attn_5F_weights_2E_75(12,77,77);onnx_3A__3A_MatMul_5F_1847(12,77,64)*output:onnx_3A__3A_Reshape_5F_1873(12,77,64) -Reshape_707:Reshape*input:onnx_3A__3A_Reshape_5F_1873(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*allowzero:0 -Transpose_708:Transpose*input:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1886(1,77,12,64)*perm:0,2,1,3 -Reshape_709:Reshape*input:onnx_3A__3A_Reshape_5F_1886(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1894(1,77,768)*allowzero:0 -MatMul_710:MatMul*input:onnx_3A__3A_MatMul_5F_1894(1,77,768);onnx_3A__3A_MatMul_5F_2783.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1896(1,77,768) -Add_711:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1896(1,77,768)*output:onnx_3A__3A_Add_5F_1897(1,77,768) -Add_712:Add*input:input_2E_79(1,77,768);onnx_3A__3A_Add_5F_1897(1,77,768)*output:input_2E_83(1,77,768) -ReduceMean_713:ReduceMean*input:input_2E_83(1,77,768)*output:onnx_3A__3A_Sub_5F_1899(1,77,1)*axes:-1 -Sub_714:Sub*input:input_2E_83(1,77,768);onnx_3A__3A_Sub_5F_1899(1,77,1)*output:onnx_3A__3A_Pow_5F_1900(1,77,768) -Pow_716:Pow*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1902(1,77,768) -ReduceMean_717:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1902(1,77,768)*output:onnx_3A__3A_Add_5F_1903(1,77,1)*axes:-1 -Add_719:Add*input:onnx_3A__3A_Add_5F_1903(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1905(1,77,1) -Sqrt_720:Sqrt*input:onnx_3A__3A_Sqrt_5F_1905(1,77,1)*output:onnx_3A__3A_Div_5F_1906(1,77,1) -Div_721:Div*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Div_5F_1906(1,77,1)*output:onnx_3A__3A_Mul_5F_1907(1,77,768) -Mul_722:Mul*input:onnx_3A__3A_Mul_5F_1907(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1908(1,77,768) -Add_723:Add*input:onnx_3A__3A_Add_5F_1908(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1909(1,77,768) -MatMul_724:MatMul*input:onnx_3A__3A_MatMul_5F_1909(1,77,768);onnx_3A__3A_MatMul_5F_2784.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1911(1,77,3072) -Add_725:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1911(1,77,3072)*output:onnx_3A__3A_Mul_5F_1912(1,77,3072) -Mul_727:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072) -Sigmoid_728:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072)*output:onnx_3A__3A_Mul_5F_1915(1,77,3072) -Mul_729:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_1915(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1916(1,77,3072) -MatMul_730:MatMul*input:onnx_3A__3A_MatMul_5F_1916(1,77,3072);onnx_3A__3A_MatMul_5F_2785.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1918(1,77,768) -Add_731:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1918(1,77,768)*output:onnx_3A__3A_Add_5F_1919(1,77,768) -Add_732:Add*input:input_2E_83(1,77,768);onnx_3A__3A_Add_5F_1919(1,77,768)*output:input_2E_87(1,77,768) -ReduceMean_733:ReduceMean*input:input_2E_87(1,77,768)*output:onnx_3A__3A_Sub_5F_1921(1,77,1)*axes:-1 -Sub_734:Sub*input:input_2E_87(1,77,768);onnx_3A__3A_Sub_5F_1921(1,77,1)*output:onnx_3A__3A_Pow_5F_1922(1,77,768) -Pow_736:Pow*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1924(1,77,768) -ReduceMean_737:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1924(1,77,768)*output:onnx_3A__3A_Add_5F_1925(1,77,1)*axes:-1 -Add_739:Add*input:onnx_3A__3A_Add_5F_1925(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1927(1,77,1) -Sqrt_740:Sqrt*input:onnx_3A__3A_Sqrt_5F_1927(1,77,1)*output:onnx_3A__3A_Div_5F_1928(1,77,1) -Div_741:Div*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Div_5F_1928(1,77,1)*output:onnx_3A__3A_Mul_5F_1929(1,77,768) -Mul_742:Mul*input:onnx_3A__3A_Mul_5F_1929(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1930(1,77,768) -Add_743:Add*input:onnx_3A__3A_Add_5F_1930(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1931(1,77,768) -MatMul_744:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2786.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1936(1,77,768) -Add_745:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1936(1,77,768)*output:onnx_3A__3A_Mul_5F_1937(1,77,768) -Mul_747:Mul*input:onnx_3A__3A_Mul_5F_1937(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_39(1,77,768) -MatMul_748:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2787.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1941(1,77,768) -Add_749:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1941(1,77,768)*output:onnx_3A__3A_Reshape_5F_1942(1,77,768) -Reshape_750:Reshape*input:onnx_3A__3A_Reshape_5F_1942(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*allowzero:0 -Transpose_751:Transpose*input:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1956(1,12,77,64)*perm:0,2,1,3 -MatMul_752:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2793.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1958(1,77,768) -Add_753:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1958(1,77,768)*output:onnx_3A__3A_Reshape_5F_1959(1,77,768) -Reshape_754:Reshape*input:onnx_3A__3A_Reshape_5F_1959(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*allowzero:0 -Transpose_755:Transpose*input:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1973(1,12,77,64)*perm:0,2,1,3 -Reshape_756:Reshape*input:query_5F_states_2E_39(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*allowzero:0 -Transpose_757:Transpose*input:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1987(1,12,77,64)*perm:0,2,1,3 -Reshape_758:Reshape*input:onnx_3A__3A_Reshape_5F_1987(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1997(12,77,64)*allowzero:0 -Reshape_759:Reshape*input:onnx_3A__3A_Reshape_5F_1956(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2007(12,77,64)*allowzero:0 -Reshape_760:Reshape*input:onnx_3A__3A_Reshape_5F_1973(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2017(12,77,64)*allowzero:0 -Transpose_761:Transpose*input:onnx_3A__3A_Transpose_5F_2007(12,77,64)*output:onnx_3A__3A_MatMul_5F_2019(12,64,77)*perm:0,2,1 -MatMul_762:MatMul*input:onnx_3A__3A_MatMul_5F_1997(12,77,64);onnx_3A__3A_MatMul_5F_2019(12,64,77)*output:onnx_3A__3A_Reshape_5F_2020(12,77,77) -Reshape_763:Reshape*input:onnx_3A__3A_Reshape_5F_2020(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2031(1,12,77,77)*allowzero:0 -Add_764:Add*input:onnx_3A__3A_Add_5F_2031(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2032(1,12,77,77) -Reshape_765:Reshape*input:onnx_3A__3A_Reshape_5F_2032(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_79(12,77,77)*allowzero:0 -Softmax_766:Softmax*input:attn_5F_weights_2E_79(12,77,77)*output:attn_5F_weights_2E_83(12,77,77)*axis:-1 -MatMul_767:MatMul*input:attn_5F_weights_2E_83(12,77,77);onnx_3A__3A_MatMul_5F_2017(12,77,64)*output:onnx_3A__3A_Reshape_5F_2043(12,77,64) -Reshape_768:Reshape*input:onnx_3A__3A_Reshape_5F_2043(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*allowzero:0 -Transpose_769:Transpose*input:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2056(1,77,12,64)*perm:0,2,1,3 -Reshape_770:Reshape*input:onnx_3A__3A_Reshape_5F_2056(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2064(1,77,768)*allowzero:0 -MatMul_771:MatMul*input:onnx_3A__3A_MatMul_5F_2064(1,77,768);onnx_3A__3A_MatMul_5F_2834.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2066(1,77,768) -Add_772:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2066(1,77,768)*output:onnx_3A__3A_Add_5F_2067(1,77,768) -Add_773:Add*input:input_2E_87(1,77,768);onnx_3A__3A_Add_5F_2067(1,77,768)*output:input_2E_91(1,77,768) -ReduceMean_774:ReduceMean*input:input_2E_91(1,77,768)*output:onnx_3A__3A_Sub_5F_2069(1,77,1)*axes:-1 -Sub_775:Sub*input:input_2E_91(1,77,768);onnx_3A__3A_Sub_5F_2069(1,77,1)*output:onnx_3A__3A_Pow_5F_2070(1,77,768) -Pow_777:Pow*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2072(1,77,768) -ReduceMean_778:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2072(1,77,768)*output:onnx_3A__3A_Add_5F_2073(1,77,1)*axes:-1 -Add_780:Add*input:onnx_3A__3A_Add_5F_2073(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2075(1,77,1) -Sqrt_781:Sqrt*input:onnx_3A__3A_Sqrt_5F_2075(1,77,1)*output:onnx_3A__3A_Div_5F_2076(1,77,1) -Div_782:Div*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Div_5F_2076(1,77,1)*output:onnx_3A__3A_Mul_5F_2077(1,77,768) -Mul_783:Mul*input:onnx_3A__3A_Mul_5F_2077(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2078(1,77,768) -Add_784:Add*input:onnx_3A__3A_Add_5F_2078(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2079(1,77,768) -MatMul_785:MatMul*input:onnx_3A__3A_MatMul_5F_2079(1,77,768);onnx_3A__3A_MatMul_5F_2835.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2081(1,77,3072) -Add_786:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2081(1,77,3072)*output:onnx_3A__3A_Mul_5F_2082(1,77,3072) -Mul_788:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072) -Sigmoid_789:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072)*output:onnx_3A__3A_Mul_5F_2085(1,77,3072) -Mul_790:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_2085(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2086(1,77,3072) -MatMul_791:MatMul*input:onnx_3A__3A_MatMul_5F_2086(1,77,3072);onnx_3A__3A_MatMul_5F_2836.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2088(1,77,768) -Add_792:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2088(1,77,768)*output:onnx_3A__3A_Add_5F_2089(1,77,768) -Add_793:Add*input:input_2E_91(1,77,768);onnx_3A__3A_Add_5F_2089(1,77,768)*output:input_2E_95(1,77,768) -ReduceMean_794:ReduceMean*input:input_2E_95(1,77,768)*output:onnx_3A__3A_Sub_5F_2091(1,77,1)*axes:-1 -Sub_795:Sub*input:input_2E_95(1,77,768);onnx_3A__3A_Sub_5F_2091(1,77,1)*output:onnx_3A__3A_Pow_5F_2092(1,77,768) -Pow_797:Pow*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2094(1,77,768) -ReduceMean_798:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2094(1,77,768)*output:onnx_3A__3A_Add_5F_2095(1,77,1)*axes:-1 -Add_800:Add*input:onnx_3A__3A_Add_5F_2095(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2097(1,77,1) -Sqrt_801:Sqrt*input:onnx_3A__3A_Sqrt_5F_2097(1,77,1)*output:onnx_3A__3A_Div_5F_2098(1,77,1) -Div_802:Div*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Div_5F_2098(1,77,1)*output:onnx_3A__3A_Mul_5F_2099(1,77,768) -Mul_803:Mul*input:onnx_3A__3A_Mul_5F_2099(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2100(1,77,768) -Add_804:Add*input:onnx_3A__3A_Add_5F_2100(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2101(1,77,768) -MatMul_805:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2837.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2106(1,77,768) -Add_806:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2106(1,77,768)*output:onnx_3A__3A_Mul_5F_2107(1,77,768) -Mul_808:Mul*input:onnx_3A__3A_Mul_5F_2107(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_43(1,77,768) -MatMul_809:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2838.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2111(1,77,768) -Add_810:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2111(1,77,768)*output:onnx_3A__3A_Reshape_5F_2112(1,77,768) -Reshape_811:Reshape*input:onnx_3A__3A_Reshape_5F_2112(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*allowzero:0 -Transpose_812:Transpose*input:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2126(1,12,77,64)*perm:0,2,1,3 -MatMul_813:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2844.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2128(1,77,768) -Add_814:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2128(1,77,768)*output:onnx_3A__3A_Reshape_5F_2129(1,77,768) -Reshape_815:Reshape*input:onnx_3A__3A_Reshape_5F_2129(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*allowzero:0 -Transpose_816:Transpose*input:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2143(1,12,77,64)*perm:0,2,1,3 -Reshape_817:Reshape*input:query_5F_states_2E_43(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*allowzero:0 -Transpose_818:Transpose*input:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2157(1,12,77,64)*perm:0,2,1,3 -Reshape_819:Reshape*input:onnx_3A__3A_Reshape_5F_2157(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2167(12,77,64)*allowzero:0 -Reshape_820:Reshape*input:onnx_3A__3A_Reshape_5F_2126(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2177(12,77,64)*allowzero:0 -Reshape_821:Reshape*input:onnx_3A__3A_Reshape_5F_2143(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2187(12,77,64)*allowzero:0 -Transpose_822:Transpose*input:onnx_3A__3A_Transpose_5F_2177(12,77,64)*output:onnx_3A__3A_MatMul_5F_2189(12,64,77)*perm:0,2,1 -MatMul_823:MatMul*input:onnx_3A__3A_MatMul_5F_2167(12,77,64);onnx_3A__3A_MatMul_5F_2189(12,64,77)*output:onnx_3A__3A_Reshape_5F_2190(12,77,77) -Reshape_824:Reshape*input:onnx_3A__3A_Reshape_5F_2190(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2201(1,12,77,77)*allowzero:0 -Add_825:Add*input:onnx_3A__3A_Add_5F_2201(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2202(1,12,77,77) -Reshape_826:Reshape*input:onnx_3A__3A_Reshape_5F_2202(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_87(12,77,77)*allowzero:0 -Softmax_827:Softmax*input:attn_5F_weights_2E_87(12,77,77)*output:attn_5F_weights_2E_91(12,77,77)*axis:-1 -MatMul_828:MatMul*input:attn_5F_weights_2E_91(12,77,77);onnx_3A__3A_MatMul_5F_2187(12,77,64)*output:onnx_3A__3A_Reshape_5F_2213(12,77,64) -Reshape_829:Reshape*input:onnx_3A__3A_Reshape_5F_2213(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*allowzero:0 -Transpose_830:Transpose*input:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2226(1,77,12,64)*perm:0,2,1,3 -Reshape_831:Reshape*input:onnx_3A__3A_Reshape_5F_2226(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2234(1,77,768)*allowzero:0 -MatMul_832:MatMul*input:onnx_3A__3A_MatMul_5F_2234(1,77,768);onnx_3A__3A_MatMul_5F_2885.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2236(1,77,768) -Add_833:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2236(1,77,768)*output:onnx_3A__3A_Add_5F_2237(1,77,768) -Add_834:Add*input:input_2E_95(1,77,768);onnx_3A__3A_Add_5F_2237(1,77,768)*output:input_2E_99(1,77,768) -ReduceMean_835:ReduceMean*input:input_2E_99(1,77,768)*output:onnx_3A__3A_Sub_5F_2239(1,77,1)*axes:-1 -Sub_836:Sub*input:input_2E_99(1,77,768);onnx_3A__3A_Sub_5F_2239(1,77,1)*output:onnx_3A__3A_Pow_5F_2240(1,77,768) -Pow_838:Pow*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2242(1,77,768) -ReduceMean_839:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2242(1,77,768)*output:onnx_3A__3A_Add_5F_2243(1,77,1)*axes:-1 -Add_841:Add*input:onnx_3A__3A_Add_5F_2243(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2245(1,77,1) -Sqrt_842:Sqrt*input:onnx_3A__3A_Sqrt_5F_2245(1,77,1)*output:onnx_3A__3A_Div_5F_2246(1,77,1) -Div_843:Div*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Div_5F_2246(1,77,1)*output:onnx_3A__3A_Mul_5F_2247(1,77,768) -Mul_844:Mul*input:onnx_3A__3A_Mul_5F_2247(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2248(1,77,768) -Add_845:Add*input:onnx_3A__3A_Add_5F_2248(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2249(1,77,768) -MatMul_846:MatMul*input:onnx_3A__3A_MatMul_5F_2249(1,77,768);onnx_3A__3A_MatMul_5F_2886.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2251(1,77,3072) -Add_847:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2251(1,77,3072)*output:onnx_3A__3A_Mul_5F_2252(1,77,3072) -Mul_849:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072) -Sigmoid_850:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072)*output:onnx_3A__3A_Mul_5F_2255(1,77,3072) -Mul_851:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_2255(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2256(1,77,3072) -MatMul_852:MatMul*input:onnx_3A__3A_MatMul_5F_2256(1,77,3072);onnx_3A__3A_MatMul_5F_2887.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2258(1,77,768) -Add_853:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2258(1,77,768)*output:onnx_3A__3A_Add_5F_2259(1,77,768) -Add_854:Add*input:input_2E_99(1,77,768);onnx_3A__3A_Add_5F_2259(1,77,768)*output:input_2E_103(1,77,768) -ReduceMean_855:ReduceMean*input:input_2E_103(1,77,768)*output:onnx_3A__3A_Sub_5F_2261(1,77,1)*axes:-1 -Sub_856:Sub*input:input_2E_103(1,77,768);onnx_3A__3A_Sub_5F_2261(1,77,1)*output:onnx_3A__3A_Pow_5F_2262(1,77,768) -Pow_858:Pow*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2264(1,77,768) -ReduceMean_859:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2264(1,77,768)*output:onnx_3A__3A_Add_5F_2265(1,77,1)*axes:-1 -Add_861:Add*input:onnx_3A__3A_Add_5F_2265(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2267(1,77,1) -Sqrt_862:Sqrt*input:onnx_3A__3A_Sqrt_5F_2267(1,77,1)*output:onnx_3A__3A_Div_5F_2268(1,77,1) -Div_863:Div*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Div_5F_2268(1,77,1)*output:onnx_3A__3A_Mul_5F_2269(1,77,768) -Mul_864:Mul*input:onnx_3A__3A_Mul_5F_2269(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2270(1,77,768) -Add_865:Add*input:onnx_3A__3A_Add_5F_2270(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_bias.bin(float32:768)*output:2271(1,77,768) +Reshape_113:Reshape*input:onnx_3A__3A_Reshape_5F_0(1,77);onnx_3A__3A_Reshape_5F_2274.bin(int64:2)*output:input(1,77)*allowzero:0 +Gather_114:Gather*input:text_5F_model_2E_embeddings_2E_token_5F_embedding_2E_wrapped_2E_weight.bin(float32:49408,768);input(1,77)*output:onnx_3A__3A_Add_5F_212(1,77,768) +Add_116:Add*input:onnx_3A__3A_Add_5F_212(1,77,768);onnx_3A__3A_Add_5F_213.bin(float32:1,77,768)*output:input_2E_7(1,77,768) +ReduceMean_123:ReduceMean*input:input_2E_7(1,77,768)*output:onnx_3A__3A_Sub_5F_221(1,77,1)*axes:-1 +Sub_124:Sub*input:input_2E_7(1,77,768);onnx_3A__3A_Sub_5F_221(1,77,1)*output:onnx_3A__3A_Pow_5F_222(1,77,768) +Pow_126:Pow*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_224(1,77,768) +ReduceMean_127:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_224(1,77,768)*output:onnx_3A__3A_Add_5F_225(1,77,1)*axes:-1 +Add_129:Add*input:onnx_3A__3A_Add_5F_225(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_227(1,77,1) +Sqrt_130:Sqrt*input:onnx_3A__3A_Sqrt_5F_227(1,77,1)*output:onnx_3A__3A_Div_5F_228(1,77,1) +Div_131:Div*input:onnx_3A__3A_Pow_5F_222(1,77,768);onnx_3A__3A_Div_5F_228(1,77,1)*output:onnx_3A__3A_Mul_5F_229(1,77,768) +Mul_132:Mul*input:onnx_3A__3A_Mul_5F_229(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_230(1,77,768) +Add_133:Add*input:onnx_3A__3A_Add_5F_230(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_231(1,77,768) +MatMul_134:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2276.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_236(1,77,768) +Add_135:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_236(1,77,768)*output:onnx_3A__3A_Mul_5F_237(1,77,768) +Mul_137:Mul*input:onnx_3A__3A_Mul_5F_237(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states(1,77,768) +MatMul_138:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2277.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_241(1,77,768) +Add_139:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_241(1,77,768)*output:onnx_3A__3A_Reshape_5F_242(1,77,768) +Reshape_140:Reshape*input:onnx_3A__3A_Reshape_5F_242(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*allowzero:0 +Transpose_141:Transpose*input:onnx_3A__3A_Transpose_5F_255(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_256(1,12,77,64)*perm:0,2,1,3 +MatMul_142:MatMul*input:onnx_3A__3A_MatMul_5F_231(1,77,768);onnx_3A__3A_MatMul_5F_2283.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_258(1,77,768) +Add_143:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_258(1,77,768)*output:onnx_3A__3A_Reshape_5F_259(1,77,768) +Reshape_144:Reshape*input:onnx_3A__3A_Reshape_5F_259(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*allowzero:0 +Transpose_145:Transpose*input:onnx_3A__3A_Transpose_5F_272(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_273(1,12,77,64)*perm:0,2,1,3 +Reshape_146:Reshape*input:query_5F_states(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*allowzero:0 +Transpose_147:Transpose*input:onnx_3A__3A_Transpose_5F_286(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_287(1,12,77,64)*perm:0,2,1,3 +Reshape_148:Reshape*input:onnx_3A__3A_Reshape_5F_287(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_297(12,77,64)*allowzero:0 +Reshape_149:Reshape*input:onnx_3A__3A_Reshape_5F_256(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_307(12,77,64)*allowzero:0 +Reshape_150:Reshape*input:onnx_3A__3A_Reshape_5F_273(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_317(12,77,64)*allowzero:0 +Transpose_151:Transpose*input:onnx_3A__3A_Transpose_5F_307(12,77,64)*output:onnx_3A__3A_MatMul_5F_319(12,64,77)*perm:0,2,1 +MatMul_152:MatMul*input:onnx_3A__3A_MatMul_5F_297(12,77,64);onnx_3A__3A_MatMul_5F_319(12,64,77)*output:onnx_3A__3A_Reshape_5F_320(12,77,77) +Reshape_153:Reshape*input:onnx_3A__3A_Reshape_5F_320(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_331(1,12,77,77)*allowzero:0 +Add_154:Add*input:onnx_3A__3A_Add_5F_331(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_332(1,12,77,77) +Reshape_155:Reshape*input:onnx_3A__3A_Reshape_5F_332(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights(12,77,77)*allowzero:0 +Softmax_156:Softmax*input:attn_5F_weights(12,77,77)*output:attn_5F_weights_2E_3(12,77,77)*axis:-1 +MatMul_157:MatMul*input:attn_5F_weights_2E_3(12,77,77);onnx_3A__3A_MatMul_5F_317(12,77,64)*output:onnx_3A__3A_Reshape_5F_343(12,77,64) +Reshape_158:Reshape*input:onnx_3A__3A_Reshape_5F_343(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*allowzero:0 +Transpose_159:Transpose*input:onnx_3A__3A_Transpose_5F_355(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_356(1,77,12,64)*perm:0,2,1,3 +Reshape_160:Reshape*input:onnx_3A__3A_Reshape_5F_356(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_364(1,77,768)*allowzero:0 +MatMul_161:MatMul*input:onnx_3A__3A_MatMul_5F_364(1,77,768);onnx_3A__3A_MatMul_5F_2324.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_366(1,77,768) +Add_162:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_366(1,77,768)*output:onnx_3A__3A_Add_5F_367(1,77,768) +Add_163:Add*input:input_2E_7(1,77,768);onnx_3A__3A_Add_5F_367(1,77,768)*output:input_2E_11(1,77,768) +ReduceMean_164:ReduceMean*input:input_2E_11(1,77,768)*output:onnx_3A__3A_Sub_5F_369(1,77,1)*axes:-1 +Sub_165:Sub*input:input_2E_11(1,77,768);onnx_3A__3A_Sub_5F_369(1,77,1)*output:onnx_3A__3A_Pow_5F_370(1,77,768) +Pow_167:Pow*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_372(1,77,768) +ReduceMean_168:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_372(1,77,768)*output:onnx_3A__3A_Add_5F_373(1,77,1)*axes:-1 +Add_170:Add*input:onnx_3A__3A_Add_5F_373(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_375(1,77,1) +Sqrt_171:Sqrt*input:onnx_3A__3A_Sqrt_5F_375(1,77,1)*output:onnx_3A__3A_Div_5F_376(1,77,1) +Div_172:Div*input:onnx_3A__3A_Pow_5F_370(1,77,768);onnx_3A__3A_Div_5F_376(1,77,1)*output:onnx_3A__3A_Mul_5F_377(1,77,768) +Mul_173:Mul*input:onnx_3A__3A_Mul_5F_377(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_378(1,77,768) +Add_174:Add*input:onnx_3A__3A_Add_5F_378(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_0_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_379(1,77,768) +MatMul_175:MatMul*input:onnx_3A__3A_MatMul_5F_379(1,77,768);onnx_3A__3A_MatMul_5F_2325.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_381(1,77,3072) +Add_176:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_381(1,77,3072)*output:onnx_3A__3A_Mul_5F_382(1,77,3072) +Mul_178:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_384(1,77,3072) +Sigmoid_179:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_384(1,77,3072)*output:onnx_3A__3A_Mul_5F_385(1,77,3072) +Mul_180:Mul*input:onnx_3A__3A_Mul_5F_382(1,77,3072);onnx_3A__3A_Mul_5F_385(1,77,3072)*output:onnx_3A__3A_MatMul_5F_386(1,77,3072) +MatMul_181:MatMul*input:onnx_3A__3A_MatMul_5F_386(1,77,3072);onnx_3A__3A_MatMul_5F_2326.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_388(1,77,768) +Add_182:Add*input:text_5F_model_2E_encoder_2E_layers_2E_0_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_388(1,77,768)*output:onnx_3A__3A_Add_5F_389(1,77,768) +Add_183:Add*input:input_2E_11(1,77,768);onnx_3A__3A_Add_5F_389(1,77,768)*output:input_2E_15(1,77,768) +ReduceMean_184:ReduceMean*input:input_2E_15(1,77,768)*output:onnx_3A__3A_Sub_5F_391(1,77,1)*axes:-1 +Sub_185:Sub*input:input_2E_15(1,77,768);onnx_3A__3A_Sub_5F_391(1,77,1)*output:onnx_3A__3A_Pow_5F_392(1,77,768) +Pow_187:Pow*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_394(1,77,768) +ReduceMean_188:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_394(1,77,768)*output:onnx_3A__3A_Add_5F_395(1,77,1)*axes:-1 +Add_190:Add*input:onnx_3A__3A_Add_5F_395(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_397(1,77,1) +Sqrt_191:Sqrt*input:onnx_3A__3A_Sqrt_5F_397(1,77,1)*output:onnx_3A__3A_Div_5F_398(1,77,1) +Div_192:Div*input:onnx_3A__3A_Pow_5F_392(1,77,768);onnx_3A__3A_Div_5F_398(1,77,1)*output:onnx_3A__3A_Mul_5F_399(1,77,768) +Mul_193:Mul*input:onnx_3A__3A_Mul_5F_399(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_400(1,77,768) +Add_194:Add*input:onnx_3A__3A_Add_5F_400(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_401(1,77,768) +MatMul_195:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2327.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_406(1,77,768) +Add_196:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_406(1,77,768)*output:onnx_3A__3A_Mul_5F_407(1,77,768) +Mul_198:Mul*input:onnx_3A__3A_Mul_5F_407(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_3(1,77,768) +MatMul_199:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2328.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_411(1,77,768) +Add_200:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_411(1,77,768)*output:onnx_3A__3A_Reshape_5F_412(1,77,768) +Reshape_201:Reshape*input:onnx_3A__3A_Reshape_5F_412(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*allowzero:0 +Transpose_202:Transpose*input:onnx_3A__3A_Transpose_5F_425(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_426(1,12,77,64)*perm:0,2,1,3 +MatMul_203:MatMul*input:onnx_3A__3A_MatMul_5F_401(1,77,768);onnx_3A__3A_MatMul_5F_2334.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_428(1,77,768) +Add_204:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_428(1,77,768)*output:onnx_3A__3A_Reshape_5F_429(1,77,768) +Reshape_205:Reshape*input:onnx_3A__3A_Reshape_5F_429(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*allowzero:0 +Transpose_206:Transpose*input:onnx_3A__3A_Transpose_5F_442(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_443(1,12,77,64)*perm:0,2,1,3 +Reshape_207:Reshape*input:query_5F_states_2E_3(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*allowzero:0 +Transpose_208:Transpose*input:onnx_3A__3A_Transpose_5F_456(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_457(1,12,77,64)*perm:0,2,1,3 +Reshape_209:Reshape*input:onnx_3A__3A_Reshape_5F_457(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_467(12,77,64)*allowzero:0 +Reshape_210:Reshape*input:onnx_3A__3A_Reshape_5F_426(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_477(12,77,64)*allowzero:0 +Reshape_211:Reshape*input:onnx_3A__3A_Reshape_5F_443(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_487(12,77,64)*allowzero:0 +Transpose_212:Transpose*input:onnx_3A__3A_Transpose_5F_477(12,77,64)*output:onnx_3A__3A_MatMul_5F_489(12,64,77)*perm:0,2,1 +MatMul_213:MatMul*input:onnx_3A__3A_MatMul_5F_467(12,77,64);onnx_3A__3A_MatMul_5F_489(12,64,77)*output:onnx_3A__3A_Reshape_5F_490(12,77,77) +Reshape_214:Reshape*input:onnx_3A__3A_Reshape_5F_490(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_501(1,12,77,77)*allowzero:0 +Add_215:Add*input:onnx_3A__3A_Add_5F_501(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_502(1,12,77,77) +Reshape_216:Reshape*input:onnx_3A__3A_Reshape_5F_502(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_7(12,77,77)*allowzero:0 +Softmax_217:Softmax*input:attn_5F_weights_2E_7(12,77,77)*output:attn_5F_weights_2E_11(12,77,77)*axis:-1 +MatMul_218:MatMul*input:attn_5F_weights_2E_11(12,77,77);onnx_3A__3A_MatMul_5F_487(12,77,64)*output:onnx_3A__3A_Reshape_5F_513(12,77,64) +Reshape_219:Reshape*input:onnx_3A__3A_Reshape_5F_513(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*allowzero:0 +Transpose_220:Transpose*input:onnx_3A__3A_Transpose_5F_525(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_526(1,77,12,64)*perm:0,2,1,3 +Reshape_221:Reshape*input:onnx_3A__3A_Reshape_5F_526(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_534(1,77,768)*allowzero:0 +MatMul_222:MatMul*input:onnx_3A__3A_MatMul_5F_534(1,77,768);onnx_3A__3A_MatMul_5F_2375.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_536(1,77,768) +Add_223:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_536(1,77,768)*output:onnx_3A__3A_Add_5F_537(1,77,768) +Add_224:Add*input:input_2E_15(1,77,768);onnx_3A__3A_Add_5F_537(1,77,768)*output:input_2E_19(1,77,768) +ReduceMean_225:ReduceMean*input:input_2E_19(1,77,768)*output:onnx_3A__3A_Sub_5F_539(1,77,1)*axes:-1 +Sub_226:Sub*input:input_2E_19(1,77,768);onnx_3A__3A_Sub_5F_539(1,77,1)*output:onnx_3A__3A_Pow_5F_540(1,77,768) +Pow_228:Pow*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_542(1,77,768) +ReduceMean_229:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_542(1,77,768)*output:onnx_3A__3A_Add_5F_543(1,77,1)*axes:-1 +Add_231:Add*input:onnx_3A__3A_Add_5F_543(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_545(1,77,1) +Sqrt_232:Sqrt*input:onnx_3A__3A_Sqrt_5F_545(1,77,1)*output:onnx_3A__3A_Div_5F_546(1,77,1) +Div_233:Div*input:onnx_3A__3A_Pow_5F_540(1,77,768);onnx_3A__3A_Div_5F_546(1,77,1)*output:onnx_3A__3A_Mul_5F_547(1,77,768) +Mul_234:Mul*input:onnx_3A__3A_Mul_5F_547(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_548(1,77,768) +Add_235:Add*input:onnx_3A__3A_Add_5F_548(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_1_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_549(1,77,768) +MatMul_236:MatMul*input:onnx_3A__3A_MatMul_5F_549(1,77,768);onnx_3A__3A_MatMul_5F_2376.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_551(1,77,3072) +Add_237:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_551(1,77,3072)*output:onnx_3A__3A_Mul_5F_552(1,77,3072) +Mul_239:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_554(1,77,3072) +Sigmoid_240:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_554(1,77,3072)*output:onnx_3A__3A_Mul_5F_555(1,77,3072) +Mul_241:Mul*input:onnx_3A__3A_Mul_5F_552(1,77,3072);onnx_3A__3A_Mul_5F_555(1,77,3072)*output:onnx_3A__3A_MatMul_5F_556(1,77,3072) +MatMul_242:MatMul*input:onnx_3A__3A_MatMul_5F_556(1,77,3072);onnx_3A__3A_MatMul_5F_2377.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_558(1,77,768) +Add_243:Add*input:text_5F_model_2E_encoder_2E_layers_2E_1_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_558(1,77,768)*output:onnx_3A__3A_Add_5F_559(1,77,768) +Add_244:Add*input:input_2E_19(1,77,768);onnx_3A__3A_Add_5F_559(1,77,768)*output:input_2E_23(1,77,768) +ReduceMean_245:ReduceMean*input:input_2E_23(1,77,768)*output:onnx_3A__3A_Sub_5F_561(1,77,1)*axes:-1 +Sub_246:Sub*input:input_2E_23(1,77,768);onnx_3A__3A_Sub_5F_561(1,77,1)*output:onnx_3A__3A_Pow_5F_562(1,77,768) +Pow_248:Pow*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_564(1,77,768) +ReduceMean_249:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_564(1,77,768)*output:onnx_3A__3A_Add_5F_565(1,77,1)*axes:-1 +Add_251:Add*input:onnx_3A__3A_Add_5F_565(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_567(1,77,1) +Sqrt_252:Sqrt*input:onnx_3A__3A_Sqrt_5F_567(1,77,1)*output:onnx_3A__3A_Div_5F_568(1,77,1) +Div_253:Div*input:onnx_3A__3A_Pow_5F_562(1,77,768);onnx_3A__3A_Div_5F_568(1,77,1)*output:onnx_3A__3A_Mul_5F_569(1,77,768) +Mul_254:Mul*input:onnx_3A__3A_Mul_5F_569(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_570(1,77,768) +Add_255:Add*input:onnx_3A__3A_Add_5F_570(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_571(1,77,768) +MatMul_256:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2378.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_576(1,77,768) +Add_257:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_576(1,77,768)*output:onnx_3A__3A_Mul_5F_577(1,77,768) +Mul_259:Mul*input:onnx_3A__3A_Mul_5F_577(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_7(1,77,768) +MatMul_260:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2379.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_581(1,77,768) +Add_261:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_581(1,77,768)*output:onnx_3A__3A_Reshape_5F_582(1,77,768) +Reshape_262:Reshape*input:onnx_3A__3A_Reshape_5F_582(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*allowzero:0 +Transpose_263:Transpose*input:onnx_3A__3A_Transpose_5F_595(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_596(1,12,77,64)*perm:0,2,1,3 +MatMul_264:MatMul*input:onnx_3A__3A_MatMul_5F_571(1,77,768);onnx_3A__3A_MatMul_5F_2385.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_598(1,77,768) +Add_265:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_598(1,77,768)*output:onnx_3A__3A_Reshape_5F_599(1,77,768) +Reshape_266:Reshape*input:onnx_3A__3A_Reshape_5F_599(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*allowzero:0 +Transpose_267:Transpose*input:onnx_3A__3A_Transpose_5F_612(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_613(1,12,77,64)*perm:0,2,1,3 +Reshape_268:Reshape*input:query_5F_states_2E_7(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*allowzero:0 +Transpose_269:Transpose*input:onnx_3A__3A_Transpose_5F_626(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_627(1,12,77,64)*perm:0,2,1,3 +Reshape_270:Reshape*input:onnx_3A__3A_Reshape_5F_627(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_637(12,77,64)*allowzero:0 +Reshape_271:Reshape*input:onnx_3A__3A_Reshape_5F_596(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_647(12,77,64)*allowzero:0 +Reshape_272:Reshape*input:onnx_3A__3A_Reshape_5F_613(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_657(12,77,64)*allowzero:0 +Transpose_273:Transpose*input:onnx_3A__3A_Transpose_5F_647(12,77,64)*output:onnx_3A__3A_MatMul_5F_659(12,64,77)*perm:0,2,1 +MatMul_274:MatMul*input:onnx_3A__3A_MatMul_5F_637(12,77,64);onnx_3A__3A_MatMul_5F_659(12,64,77)*output:onnx_3A__3A_Reshape_5F_660(12,77,77) +Reshape_275:Reshape*input:onnx_3A__3A_Reshape_5F_660(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_671(1,12,77,77)*allowzero:0 +Add_276:Add*input:onnx_3A__3A_Add_5F_671(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_672(1,12,77,77) +Reshape_277:Reshape*input:onnx_3A__3A_Reshape_5F_672(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_15(12,77,77)*allowzero:0 +Softmax_278:Softmax*input:attn_5F_weights_2E_15(12,77,77)*output:attn_5F_weights_2E_19(12,77,77)*axis:-1 +MatMul_279:MatMul*input:attn_5F_weights_2E_19(12,77,77);onnx_3A__3A_MatMul_5F_657(12,77,64)*output:onnx_3A__3A_Reshape_5F_683(12,77,64) +Reshape_280:Reshape*input:onnx_3A__3A_Reshape_5F_683(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*allowzero:0 +Transpose_281:Transpose*input:onnx_3A__3A_Transpose_5F_695(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_696(1,77,12,64)*perm:0,2,1,3 +Reshape_282:Reshape*input:onnx_3A__3A_Reshape_5F_696(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_704(1,77,768)*allowzero:0 +MatMul_283:MatMul*input:onnx_3A__3A_MatMul_5F_704(1,77,768);onnx_3A__3A_MatMul_5F_2426.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_706(1,77,768) +Add_284:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_706(1,77,768)*output:onnx_3A__3A_Add_5F_707(1,77,768) +Add_285:Add*input:input_2E_23(1,77,768);onnx_3A__3A_Add_5F_707(1,77,768)*output:input_2E_27(1,77,768) +ReduceMean_286:ReduceMean*input:input_2E_27(1,77,768)*output:onnx_3A__3A_Sub_5F_709(1,77,1)*axes:-1 +Sub_287:Sub*input:input_2E_27(1,77,768);onnx_3A__3A_Sub_5F_709(1,77,1)*output:onnx_3A__3A_Pow_5F_710(1,77,768) +Pow_289:Pow*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_712(1,77,768) +ReduceMean_290:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_712(1,77,768)*output:onnx_3A__3A_Add_5F_713(1,77,1)*axes:-1 +Add_292:Add*input:onnx_3A__3A_Add_5F_713(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_715(1,77,1) +Sqrt_293:Sqrt*input:onnx_3A__3A_Sqrt_5F_715(1,77,1)*output:onnx_3A__3A_Div_5F_716(1,77,1) +Div_294:Div*input:onnx_3A__3A_Pow_5F_710(1,77,768);onnx_3A__3A_Div_5F_716(1,77,1)*output:onnx_3A__3A_Mul_5F_717(1,77,768) +Mul_295:Mul*input:onnx_3A__3A_Mul_5F_717(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_718(1,77,768) +Add_296:Add*input:onnx_3A__3A_Add_5F_718(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_2_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_719(1,77,768) +MatMul_297:MatMul*input:onnx_3A__3A_MatMul_5F_719(1,77,768);onnx_3A__3A_MatMul_5F_2427.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_721(1,77,3072) +Add_298:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_721(1,77,3072)*output:onnx_3A__3A_Mul_5F_722(1,77,3072) +Mul_300:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_724(1,77,3072) +Sigmoid_301:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_724(1,77,3072)*output:onnx_3A__3A_Mul_5F_725(1,77,3072) +Mul_302:Mul*input:onnx_3A__3A_Mul_5F_722(1,77,3072);onnx_3A__3A_Mul_5F_725(1,77,3072)*output:onnx_3A__3A_MatMul_5F_726(1,77,3072) +MatMul_303:MatMul*input:onnx_3A__3A_MatMul_5F_726(1,77,3072);onnx_3A__3A_MatMul_5F_2428.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_728(1,77,768) +Add_304:Add*input:text_5F_model_2E_encoder_2E_layers_2E_2_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_728(1,77,768)*output:onnx_3A__3A_Add_5F_729(1,77,768) +Add_305:Add*input:input_2E_27(1,77,768);onnx_3A__3A_Add_5F_729(1,77,768)*output:input_2E_31(1,77,768) +ReduceMean_306:ReduceMean*input:input_2E_31(1,77,768)*output:onnx_3A__3A_Sub_5F_731(1,77,1)*axes:-1 +Sub_307:Sub*input:input_2E_31(1,77,768);onnx_3A__3A_Sub_5F_731(1,77,1)*output:onnx_3A__3A_Pow_5F_732(1,77,768) +Pow_309:Pow*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_734(1,77,768) +ReduceMean_310:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_734(1,77,768)*output:onnx_3A__3A_Add_5F_735(1,77,1)*axes:-1 +Add_312:Add*input:onnx_3A__3A_Add_5F_735(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_737(1,77,1) +Sqrt_313:Sqrt*input:onnx_3A__3A_Sqrt_5F_737(1,77,1)*output:onnx_3A__3A_Div_5F_738(1,77,1) +Div_314:Div*input:onnx_3A__3A_Pow_5F_732(1,77,768);onnx_3A__3A_Div_5F_738(1,77,1)*output:onnx_3A__3A_Mul_5F_739(1,77,768) +Mul_315:Mul*input:onnx_3A__3A_Mul_5F_739(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_740(1,77,768) +Add_316:Add*input:onnx_3A__3A_Add_5F_740(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_741(1,77,768) +MatMul_317:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2429.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_746(1,77,768) +Add_318:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_746(1,77,768)*output:onnx_3A__3A_Mul_5F_747(1,77,768) +Mul_320:Mul*input:onnx_3A__3A_Mul_5F_747(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_11(1,77,768) +MatMul_321:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2430.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_751(1,77,768) +Add_322:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_751(1,77,768)*output:onnx_3A__3A_Reshape_5F_752(1,77,768) +Reshape_323:Reshape*input:onnx_3A__3A_Reshape_5F_752(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*allowzero:0 +Transpose_324:Transpose*input:onnx_3A__3A_Transpose_5F_765(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_766(1,12,77,64)*perm:0,2,1,3 +MatMul_325:MatMul*input:onnx_3A__3A_MatMul_5F_741(1,77,768);onnx_3A__3A_MatMul_5F_2436.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_768(1,77,768) +Add_326:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_768(1,77,768)*output:onnx_3A__3A_Reshape_5F_769(1,77,768) +Reshape_327:Reshape*input:onnx_3A__3A_Reshape_5F_769(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*allowzero:0 +Transpose_328:Transpose*input:onnx_3A__3A_Transpose_5F_782(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_783(1,12,77,64)*perm:0,2,1,3 +Reshape_329:Reshape*input:query_5F_states_2E_11(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*allowzero:0 +Transpose_330:Transpose*input:onnx_3A__3A_Transpose_5F_796(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_797(1,12,77,64)*perm:0,2,1,3 +Reshape_331:Reshape*input:onnx_3A__3A_Reshape_5F_797(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_807(12,77,64)*allowzero:0 +Reshape_332:Reshape*input:onnx_3A__3A_Reshape_5F_766(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_817(12,77,64)*allowzero:0 +Reshape_333:Reshape*input:onnx_3A__3A_Reshape_5F_783(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_827(12,77,64)*allowzero:0 +Transpose_334:Transpose*input:onnx_3A__3A_Transpose_5F_817(12,77,64)*output:onnx_3A__3A_MatMul_5F_829(12,64,77)*perm:0,2,1 +MatMul_335:MatMul*input:onnx_3A__3A_MatMul_5F_807(12,77,64);onnx_3A__3A_MatMul_5F_829(12,64,77)*output:onnx_3A__3A_Reshape_5F_830(12,77,77) +Reshape_336:Reshape*input:onnx_3A__3A_Reshape_5F_830(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_841(1,12,77,77)*allowzero:0 +Add_337:Add*input:onnx_3A__3A_Add_5F_841(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_842(1,12,77,77) +Reshape_338:Reshape*input:onnx_3A__3A_Reshape_5F_842(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_23(12,77,77)*allowzero:0 +Softmax_339:Softmax*input:attn_5F_weights_2E_23(12,77,77)*output:attn_5F_weights_2E_27(12,77,77)*axis:-1 +MatMul_340:MatMul*input:attn_5F_weights_2E_27(12,77,77);onnx_3A__3A_MatMul_5F_827(12,77,64)*output:onnx_3A__3A_Reshape_5F_853(12,77,64) +Reshape_341:Reshape*input:onnx_3A__3A_Reshape_5F_853(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*allowzero:0 +Transpose_342:Transpose*input:onnx_3A__3A_Transpose_5F_865(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_866(1,77,12,64)*perm:0,2,1,3 +Reshape_343:Reshape*input:onnx_3A__3A_Reshape_5F_866(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_874(1,77,768)*allowzero:0 +MatMul_344:MatMul*input:onnx_3A__3A_MatMul_5F_874(1,77,768);onnx_3A__3A_MatMul_5F_2477.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_876(1,77,768) +Add_345:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_876(1,77,768)*output:onnx_3A__3A_Add_5F_877(1,77,768) +Add_346:Add*input:input_2E_31(1,77,768);onnx_3A__3A_Add_5F_877(1,77,768)*output:input_2E_35(1,77,768) +ReduceMean_347:ReduceMean*input:input_2E_35(1,77,768)*output:onnx_3A__3A_Sub_5F_879(1,77,1)*axes:-1 +Sub_348:Sub*input:input_2E_35(1,77,768);onnx_3A__3A_Sub_5F_879(1,77,1)*output:onnx_3A__3A_Pow_5F_880(1,77,768) +Pow_350:Pow*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_882(1,77,768) +ReduceMean_351:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_882(1,77,768)*output:onnx_3A__3A_Add_5F_883(1,77,1)*axes:-1 +Add_353:Add*input:onnx_3A__3A_Add_5F_883(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_885(1,77,1) +Sqrt_354:Sqrt*input:onnx_3A__3A_Sqrt_5F_885(1,77,1)*output:onnx_3A__3A_Div_5F_886(1,77,1) +Div_355:Div*input:onnx_3A__3A_Pow_5F_880(1,77,768);onnx_3A__3A_Div_5F_886(1,77,1)*output:onnx_3A__3A_Mul_5F_887(1,77,768) +Mul_356:Mul*input:onnx_3A__3A_Mul_5F_887(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_888(1,77,768) +Add_357:Add*input:onnx_3A__3A_Add_5F_888(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_3_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_889(1,77,768) +MatMul_358:MatMul*input:onnx_3A__3A_MatMul_5F_889(1,77,768);onnx_3A__3A_MatMul_5F_2478.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_891(1,77,3072) +Add_359:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_891(1,77,3072)*output:onnx_3A__3A_Mul_5F_892(1,77,3072) +Mul_361:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_894(1,77,3072) +Sigmoid_362:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_894(1,77,3072)*output:onnx_3A__3A_Mul_5F_895(1,77,3072) +Mul_363:Mul*input:onnx_3A__3A_Mul_5F_892(1,77,3072);onnx_3A__3A_Mul_5F_895(1,77,3072)*output:onnx_3A__3A_MatMul_5F_896(1,77,3072) +MatMul_364:MatMul*input:onnx_3A__3A_MatMul_5F_896(1,77,3072);onnx_3A__3A_MatMul_5F_2479.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_898(1,77,768) +Add_365:Add*input:text_5F_model_2E_encoder_2E_layers_2E_3_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_898(1,77,768)*output:onnx_3A__3A_Add_5F_899(1,77,768) +Add_366:Add*input:input_2E_35(1,77,768);onnx_3A__3A_Add_5F_899(1,77,768)*output:input_2E_39(1,77,768) +ReduceMean_367:ReduceMean*input:input_2E_39(1,77,768)*output:onnx_3A__3A_Sub_5F_901(1,77,1)*axes:-1 +Sub_368:Sub*input:input_2E_39(1,77,768);onnx_3A__3A_Sub_5F_901(1,77,1)*output:onnx_3A__3A_Pow_5F_902(1,77,768) +Pow_370:Pow*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_904(1,77,768) +ReduceMean_371:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_904(1,77,768)*output:onnx_3A__3A_Add_5F_905(1,77,1)*axes:-1 +Add_373:Add*input:onnx_3A__3A_Add_5F_905(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_907(1,77,1) +Sqrt_374:Sqrt*input:onnx_3A__3A_Sqrt_5F_907(1,77,1)*output:onnx_3A__3A_Div_5F_908(1,77,1) +Div_375:Div*input:onnx_3A__3A_Pow_5F_902(1,77,768);onnx_3A__3A_Div_5F_908(1,77,1)*output:onnx_3A__3A_Mul_5F_909(1,77,768) +Mul_376:Mul*input:onnx_3A__3A_Mul_5F_909(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_910(1,77,768) +Add_377:Add*input:onnx_3A__3A_Add_5F_910(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_911(1,77,768) +MatMul_378:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2480.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_916(1,77,768) +Add_379:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_916(1,77,768)*output:onnx_3A__3A_Mul_5F_917(1,77,768) +Mul_381:Mul*input:onnx_3A__3A_Mul_5F_917(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_15(1,77,768) +MatMul_382:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2481.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_921(1,77,768) +Add_383:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_921(1,77,768)*output:onnx_3A__3A_Reshape_5F_922(1,77,768) +Reshape_384:Reshape*input:onnx_3A__3A_Reshape_5F_922(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*allowzero:0 +Transpose_385:Transpose*input:onnx_3A__3A_Transpose_5F_935(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_936(1,12,77,64)*perm:0,2,1,3 +MatMul_386:MatMul*input:onnx_3A__3A_MatMul_5F_911(1,77,768);onnx_3A__3A_MatMul_5F_2487.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_938(1,77,768) +Add_387:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_938(1,77,768)*output:onnx_3A__3A_Reshape_5F_939(1,77,768) +Reshape_388:Reshape*input:onnx_3A__3A_Reshape_5F_939(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*allowzero:0 +Transpose_389:Transpose*input:onnx_3A__3A_Transpose_5F_952(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_953(1,12,77,64)*perm:0,2,1,3 +Reshape_390:Reshape*input:query_5F_states_2E_15(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*allowzero:0 +Transpose_391:Transpose*input:onnx_3A__3A_Transpose_5F_966(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_967(1,12,77,64)*perm:0,2,1,3 +Reshape_392:Reshape*input:onnx_3A__3A_Reshape_5F_967(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_977(12,77,64)*allowzero:0 +Reshape_393:Reshape*input:onnx_3A__3A_Reshape_5F_936(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_987(12,77,64)*allowzero:0 +Reshape_394:Reshape*input:onnx_3A__3A_Reshape_5F_953(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_997(12,77,64)*allowzero:0 +Transpose_395:Transpose*input:onnx_3A__3A_Transpose_5F_987(12,77,64)*output:onnx_3A__3A_MatMul_5F_999(12,64,77)*perm:0,2,1 +MatMul_396:MatMul*input:onnx_3A__3A_MatMul_5F_977(12,77,64);onnx_3A__3A_MatMul_5F_999(12,64,77)*output:onnx_3A__3A_Reshape_5F_1000(12,77,77) +Reshape_397:Reshape*input:onnx_3A__3A_Reshape_5F_1000(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1011(1,12,77,77)*allowzero:0 +Add_398:Add*input:onnx_3A__3A_Add_5F_1011(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1012(1,12,77,77) +Reshape_399:Reshape*input:onnx_3A__3A_Reshape_5F_1012(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_31(12,77,77)*allowzero:0 +Softmax_400:Softmax*input:attn_5F_weights_2E_31(12,77,77)*output:attn_5F_weights_2E_35(12,77,77)*axis:-1 +MatMul_401:MatMul*input:attn_5F_weights_2E_35(12,77,77);onnx_3A__3A_MatMul_5F_997(12,77,64)*output:onnx_3A__3A_Reshape_5F_1023(12,77,64) +Reshape_402:Reshape*input:onnx_3A__3A_Reshape_5F_1023(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*allowzero:0 +Transpose_403:Transpose*input:onnx_3A__3A_Transpose_5F_1035(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1036(1,77,12,64)*perm:0,2,1,3 +Reshape_404:Reshape*input:onnx_3A__3A_Reshape_5F_1036(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1044(1,77,768)*allowzero:0 +MatMul_405:MatMul*input:onnx_3A__3A_MatMul_5F_1044(1,77,768);onnx_3A__3A_MatMul_5F_2528.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1046(1,77,768) +Add_406:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1046(1,77,768)*output:onnx_3A__3A_Add_5F_1047(1,77,768) +Add_407:Add*input:input_2E_39(1,77,768);onnx_3A__3A_Add_5F_1047(1,77,768)*output:input_2E_43(1,77,768) +ReduceMean_408:ReduceMean*input:input_2E_43(1,77,768)*output:onnx_3A__3A_Sub_5F_1049(1,77,1)*axes:-1 +Sub_409:Sub*input:input_2E_43(1,77,768);onnx_3A__3A_Sub_5F_1049(1,77,1)*output:onnx_3A__3A_Pow_5F_1050(1,77,768) +Pow_411:Pow*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1052(1,77,768) +ReduceMean_412:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1052(1,77,768)*output:onnx_3A__3A_Add_5F_1053(1,77,1)*axes:-1 +Add_414:Add*input:onnx_3A__3A_Add_5F_1053(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1055(1,77,1) +Sqrt_415:Sqrt*input:onnx_3A__3A_Sqrt_5F_1055(1,77,1)*output:onnx_3A__3A_Div_5F_1056(1,77,1) +Div_416:Div*input:onnx_3A__3A_Pow_5F_1050(1,77,768);onnx_3A__3A_Div_5F_1056(1,77,1)*output:onnx_3A__3A_Mul_5F_1057(1,77,768) +Mul_417:Mul*input:onnx_3A__3A_Mul_5F_1057(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1058(1,77,768) +Add_418:Add*input:onnx_3A__3A_Add_5F_1058(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_4_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1059(1,77,768) +MatMul_419:MatMul*input:onnx_3A__3A_MatMul_5F_1059(1,77,768);onnx_3A__3A_MatMul_5F_2529.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1061(1,77,3072) +Add_420:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1061(1,77,3072)*output:onnx_3A__3A_Mul_5F_1062(1,77,3072) +Mul_422:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072) +Sigmoid_423:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1064(1,77,3072)*output:onnx_3A__3A_Mul_5F_1065(1,77,3072) +Mul_424:Mul*input:onnx_3A__3A_Mul_5F_1062(1,77,3072);onnx_3A__3A_Mul_5F_1065(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1066(1,77,3072) +MatMul_425:MatMul*input:onnx_3A__3A_MatMul_5F_1066(1,77,3072);onnx_3A__3A_MatMul_5F_2530.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1068(1,77,768) +Add_426:Add*input:text_5F_model_2E_encoder_2E_layers_2E_4_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1068(1,77,768)*output:onnx_3A__3A_Add_5F_1069(1,77,768) +Add_427:Add*input:input_2E_43(1,77,768);onnx_3A__3A_Add_5F_1069(1,77,768)*output:input_2E_47(1,77,768) +ReduceMean_428:ReduceMean*input:input_2E_47(1,77,768)*output:onnx_3A__3A_Sub_5F_1071(1,77,1)*axes:-1 +Sub_429:Sub*input:input_2E_47(1,77,768);onnx_3A__3A_Sub_5F_1071(1,77,1)*output:onnx_3A__3A_Pow_5F_1072(1,77,768) +Pow_431:Pow*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1074(1,77,768) +ReduceMean_432:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1074(1,77,768)*output:onnx_3A__3A_Add_5F_1075(1,77,1)*axes:-1 +Add_434:Add*input:onnx_3A__3A_Add_5F_1075(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1077(1,77,1) +Sqrt_435:Sqrt*input:onnx_3A__3A_Sqrt_5F_1077(1,77,1)*output:onnx_3A__3A_Div_5F_1078(1,77,1) +Div_436:Div*input:onnx_3A__3A_Pow_5F_1072(1,77,768);onnx_3A__3A_Div_5F_1078(1,77,1)*output:onnx_3A__3A_Mul_5F_1079(1,77,768) +Mul_437:Mul*input:onnx_3A__3A_Mul_5F_1079(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1080(1,77,768) +Add_438:Add*input:onnx_3A__3A_Add_5F_1080(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1081(1,77,768) +MatMul_439:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2531.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1086(1,77,768) +Add_440:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1086(1,77,768)*output:onnx_3A__3A_Mul_5F_1087(1,77,768) +Mul_442:Mul*input:onnx_3A__3A_Mul_5F_1087(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_19(1,77,768) +MatMul_443:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2532.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1091(1,77,768) +Add_444:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1091(1,77,768)*output:onnx_3A__3A_Reshape_5F_1092(1,77,768) +Reshape_445:Reshape*input:onnx_3A__3A_Reshape_5F_1092(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*allowzero:0 +Transpose_446:Transpose*input:onnx_3A__3A_Transpose_5F_1105(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1106(1,12,77,64)*perm:0,2,1,3 +MatMul_447:MatMul*input:onnx_3A__3A_MatMul_5F_1081(1,77,768);onnx_3A__3A_MatMul_5F_2538.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1108(1,77,768) +Add_448:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1108(1,77,768)*output:onnx_3A__3A_Reshape_5F_1109(1,77,768) +Reshape_449:Reshape*input:onnx_3A__3A_Reshape_5F_1109(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*allowzero:0 +Transpose_450:Transpose*input:onnx_3A__3A_Transpose_5F_1122(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1123(1,12,77,64)*perm:0,2,1,3 +Reshape_451:Reshape*input:query_5F_states_2E_19(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*allowzero:0 +Transpose_452:Transpose*input:onnx_3A__3A_Transpose_5F_1136(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1137(1,12,77,64)*perm:0,2,1,3 +Reshape_453:Reshape*input:onnx_3A__3A_Reshape_5F_1137(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1147(12,77,64)*allowzero:0 +Reshape_454:Reshape*input:onnx_3A__3A_Reshape_5F_1106(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1157(12,77,64)*allowzero:0 +Reshape_455:Reshape*input:onnx_3A__3A_Reshape_5F_1123(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1167(12,77,64)*allowzero:0 +Transpose_456:Transpose*input:onnx_3A__3A_Transpose_5F_1157(12,77,64)*output:onnx_3A__3A_MatMul_5F_1169(12,64,77)*perm:0,2,1 +MatMul_457:MatMul*input:onnx_3A__3A_MatMul_5F_1147(12,77,64);onnx_3A__3A_MatMul_5F_1169(12,64,77)*output:onnx_3A__3A_Reshape_5F_1170(12,77,77) +Reshape_458:Reshape*input:onnx_3A__3A_Reshape_5F_1170(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1181(1,12,77,77)*allowzero:0 +Add_459:Add*input:onnx_3A__3A_Add_5F_1181(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1182(1,12,77,77) +Reshape_460:Reshape*input:onnx_3A__3A_Reshape_5F_1182(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_39(12,77,77)*allowzero:0 +Softmax_461:Softmax*input:attn_5F_weights_2E_39(12,77,77)*output:attn_5F_weights_2E_43(12,77,77)*axis:-1 +MatMul_462:MatMul*input:attn_5F_weights_2E_43(12,77,77);onnx_3A__3A_MatMul_5F_1167(12,77,64)*output:onnx_3A__3A_Reshape_5F_1193(12,77,64) +Reshape_463:Reshape*input:onnx_3A__3A_Reshape_5F_1193(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*allowzero:0 +Transpose_464:Transpose*input:onnx_3A__3A_Transpose_5F_1205(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1206(1,77,12,64)*perm:0,2,1,3 +Reshape_465:Reshape*input:onnx_3A__3A_Reshape_5F_1206(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1214(1,77,768)*allowzero:0 +MatMul_466:MatMul*input:onnx_3A__3A_MatMul_5F_1214(1,77,768);onnx_3A__3A_MatMul_5F_2579.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1216(1,77,768) +Add_467:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1216(1,77,768)*output:onnx_3A__3A_Add_5F_1217(1,77,768) +Add_468:Add*input:input_2E_47(1,77,768);onnx_3A__3A_Add_5F_1217(1,77,768)*output:input_2E_51(1,77,768) +ReduceMean_469:ReduceMean*input:input_2E_51(1,77,768)*output:onnx_3A__3A_Sub_5F_1219(1,77,1)*axes:-1 +Sub_470:Sub*input:input_2E_51(1,77,768);onnx_3A__3A_Sub_5F_1219(1,77,1)*output:onnx_3A__3A_Pow_5F_1220(1,77,768) +Pow_472:Pow*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1222(1,77,768) +ReduceMean_473:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1222(1,77,768)*output:onnx_3A__3A_Add_5F_1223(1,77,1)*axes:-1 +Add_475:Add*input:onnx_3A__3A_Add_5F_1223(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1225(1,77,1) +Sqrt_476:Sqrt*input:onnx_3A__3A_Sqrt_5F_1225(1,77,1)*output:onnx_3A__3A_Div_5F_1226(1,77,1) +Div_477:Div*input:onnx_3A__3A_Pow_5F_1220(1,77,768);onnx_3A__3A_Div_5F_1226(1,77,1)*output:onnx_3A__3A_Mul_5F_1227(1,77,768) +Mul_478:Mul*input:onnx_3A__3A_Mul_5F_1227(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1228(1,77,768) +Add_479:Add*input:onnx_3A__3A_Add_5F_1228(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_5_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1229(1,77,768) +MatMul_480:MatMul*input:onnx_3A__3A_MatMul_5F_1229(1,77,768);onnx_3A__3A_MatMul_5F_2580.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1231(1,77,3072) +Add_481:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1231(1,77,3072)*output:onnx_3A__3A_Mul_5F_1232(1,77,3072) +Mul_483:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072) +Sigmoid_484:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1234(1,77,3072)*output:onnx_3A__3A_Mul_5F_1235(1,77,3072) +Mul_485:Mul*input:onnx_3A__3A_Mul_5F_1232(1,77,3072);onnx_3A__3A_Mul_5F_1235(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1236(1,77,3072) +MatMul_486:MatMul*input:onnx_3A__3A_MatMul_5F_1236(1,77,3072);onnx_3A__3A_MatMul_5F_2581.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1238(1,77,768) +Add_487:Add*input:text_5F_model_2E_encoder_2E_layers_2E_5_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1238(1,77,768)*output:onnx_3A__3A_Add_5F_1239(1,77,768) +Add_488:Add*input:input_2E_51(1,77,768);onnx_3A__3A_Add_5F_1239(1,77,768)*output:input_2E_55(1,77,768) +ReduceMean_489:ReduceMean*input:input_2E_55(1,77,768)*output:onnx_3A__3A_Sub_5F_1241(1,77,1)*axes:-1 +Sub_490:Sub*input:input_2E_55(1,77,768);onnx_3A__3A_Sub_5F_1241(1,77,1)*output:onnx_3A__3A_Pow_5F_1242(1,77,768) +Pow_492:Pow*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1244(1,77,768) +ReduceMean_493:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1244(1,77,768)*output:onnx_3A__3A_Add_5F_1245(1,77,1)*axes:-1 +Add_495:Add*input:onnx_3A__3A_Add_5F_1245(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1247(1,77,1) +Sqrt_496:Sqrt*input:onnx_3A__3A_Sqrt_5F_1247(1,77,1)*output:onnx_3A__3A_Div_5F_1248(1,77,1) +Div_497:Div*input:onnx_3A__3A_Pow_5F_1242(1,77,768);onnx_3A__3A_Div_5F_1248(1,77,1)*output:onnx_3A__3A_Mul_5F_1249(1,77,768) +Mul_498:Mul*input:onnx_3A__3A_Mul_5F_1249(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1250(1,77,768) +Add_499:Add*input:onnx_3A__3A_Add_5F_1250(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1251(1,77,768) +MatMul_500:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2582.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1256(1,77,768) +Add_501:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1256(1,77,768)*output:onnx_3A__3A_Mul_5F_1257(1,77,768) +Mul_503:Mul*input:onnx_3A__3A_Mul_5F_1257(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_23(1,77,768) +MatMul_504:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2583.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1261(1,77,768) +Add_505:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1261(1,77,768)*output:onnx_3A__3A_Reshape_5F_1262(1,77,768) +Reshape_506:Reshape*input:onnx_3A__3A_Reshape_5F_1262(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*allowzero:0 +Transpose_507:Transpose*input:onnx_3A__3A_Transpose_5F_1275(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1276(1,12,77,64)*perm:0,2,1,3 +MatMul_508:MatMul*input:onnx_3A__3A_MatMul_5F_1251(1,77,768);onnx_3A__3A_MatMul_5F_2589.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1278(1,77,768) +Add_509:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1278(1,77,768)*output:onnx_3A__3A_Reshape_5F_1279(1,77,768) +Reshape_510:Reshape*input:onnx_3A__3A_Reshape_5F_1279(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*allowzero:0 +Transpose_511:Transpose*input:onnx_3A__3A_Transpose_5F_1292(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1293(1,12,77,64)*perm:0,2,1,3 +Reshape_512:Reshape*input:query_5F_states_2E_23(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*allowzero:0 +Transpose_513:Transpose*input:onnx_3A__3A_Transpose_5F_1306(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1307(1,12,77,64)*perm:0,2,1,3 +Reshape_514:Reshape*input:onnx_3A__3A_Reshape_5F_1307(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1317(12,77,64)*allowzero:0 +Reshape_515:Reshape*input:onnx_3A__3A_Reshape_5F_1276(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1327(12,77,64)*allowzero:0 +Reshape_516:Reshape*input:onnx_3A__3A_Reshape_5F_1293(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1337(12,77,64)*allowzero:0 +Transpose_517:Transpose*input:onnx_3A__3A_Transpose_5F_1327(12,77,64)*output:onnx_3A__3A_MatMul_5F_1339(12,64,77)*perm:0,2,1 +MatMul_518:MatMul*input:onnx_3A__3A_MatMul_5F_1317(12,77,64);onnx_3A__3A_MatMul_5F_1339(12,64,77)*output:onnx_3A__3A_Reshape_5F_1340(12,77,77) +Reshape_519:Reshape*input:onnx_3A__3A_Reshape_5F_1340(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1351(1,12,77,77)*allowzero:0 +Add_520:Add*input:onnx_3A__3A_Add_5F_1351(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1352(1,12,77,77) +Reshape_521:Reshape*input:onnx_3A__3A_Reshape_5F_1352(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_47(12,77,77)*allowzero:0 +Softmax_522:Softmax*input:attn_5F_weights_2E_47(12,77,77)*output:attn_5F_weights_2E_51(12,77,77)*axis:-1 +MatMul_523:MatMul*input:attn_5F_weights_2E_51(12,77,77);onnx_3A__3A_MatMul_5F_1337(12,77,64)*output:onnx_3A__3A_Reshape_5F_1363(12,77,64) +Reshape_524:Reshape*input:onnx_3A__3A_Reshape_5F_1363(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*allowzero:0 +Transpose_525:Transpose*input:onnx_3A__3A_Transpose_5F_1375(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1376(1,77,12,64)*perm:0,2,1,3 +Reshape_526:Reshape*input:onnx_3A__3A_Reshape_5F_1376(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1384(1,77,768)*allowzero:0 +MatMul_527:MatMul*input:onnx_3A__3A_MatMul_5F_1384(1,77,768);onnx_3A__3A_MatMul_5F_2630.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1386(1,77,768) +Add_528:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1386(1,77,768)*output:onnx_3A__3A_Add_5F_1387(1,77,768) +Add_529:Add*input:input_2E_55(1,77,768);onnx_3A__3A_Add_5F_1387(1,77,768)*output:input_2E_59(1,77,768) +ReduceMean_530:ReduceMean*input:input_2E_59(1,77,768)*output:onnx_3A__3A_Sub_5F_1389(1,77,1)*axes:-1 +Sub_531:Sub*input:input_2E_59(1,77,768);onnx_3A__3A_Sub_5F_1389(1,77,1)*output:onnx_3A__3A_Pow_5F_1390(1,77,768) +Pow_533:Pow*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1392(1,77,768) +ReduceMean_534:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1392(1,77,768)*output:onnx_3A__3A_Add_5F_1393(1,77,1)*axes:-1 +Add_536:Add*input:onnx_3A__3A_Add_5F_1393(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1395(1,77,1) +Sqrt_537:Sqrt*input:onnx_3A__3A_Sqrt_5F_1395(1,77,1)*output:onnx_3A__3A_Div_5F_1396(1,77,1) +Div_538:Div*input:onnx_3A__3A_Pow_5F_1390(1,77,768);onnx_3A__3A_Div_5F_1396(1,77,1)*output:onnx_3A__3A_Mul_5F_1397(1,77,768) +Mul_539:Mul*input:onnx_3A__3A_Mul_5F_1397(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1398(1,77,768) +Add_540:Add*input:onnx_3A__3A_Add_5F_1398(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_6_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1399(1,77,768) +MatMul_541:MatMul*input:onnx_3A__3A_MatMul_5F_1399(1,77,768);onnx_3A__3A_MatMul_5F_2631.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1401(1,77,3072) +Add_542:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1401(1,77,3072)*output:onnx_3A__3A_Mul_5F_1402(1,77,3072) +Mul_544:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072) +Sigmoid_545:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1404(1,77,3072)*output:onnx_3A__3A_Mul_5F_1405(1,77,3072) +Mul_546:Mul*input:onnx_3A__3A_Mul_5F_1402(1,77,3072);onnx_3A__3A_Mul_5F_1405(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1406(1,77,3072) +MatMul_547:MatMul*input:onnx_3A__3A_MatMul_5F_1406(1,77,3072);onnx_3A__3A_MatMul_5F_2632.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1408(1,77,768) +Add_548:Add*input:text_5F_model_2E_encoder_2E_layers_2E_6_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1408(1,77,768)*output:onnx_3A__3A_Add_5F_1409(1,77,768) +Add_549:Add*input:input_2E_59(1,77,768);onnx_3A__3A_Add_5F_1409(1,77,768)*output:input_2E_63(1,77,768) +ReduceMean_550:ReduceMean*input:input_2E_63(1,77,768)*output:onnx_3A__3A_Sub_5F_1411(1,77,1)*axes:-1 +Sub_551:Sub*input:input_2E_63(1,77,768);onnx_3A__3A_Sub_5F_1411(1,77,1)*output:onnx_3A__3A_Pow_5F_1412(1,77,768) +Pow_553:Pow*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1414(1,77,768) +ReduceMean_554:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1414(1,77,768)*output:onnx_3A__3A_Add_5F_1415(1,77,1)*axes:-1 +Add_556:Add*input:onnx_3A__3A_Add_5F_1415(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1417(1,77,1) +Sqrt_557:Sqrt*input:onnx_3A__3A_Sqrt_5F_1417(1,77,1)*output:onnx_3A__3A_Div_5F_1418(1,77,1) +Div_558:Div*input:onnx_3A__3A_Pow_5F_1412(1,77,768);onnx_3A__3A_Div_5F_1418(1,77,1)*output:onnx_3A__3A_Mul_5F_1419(1,77,768) +Mul_559:Mul*input:onnx_3A__3A_Mul_5F_1419(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1420(1,77,768) +Add_560:Add*input:onnx_3A__3A_Add_5F_1420(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1421(1,77,768) +MatMul_561:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2633.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1426(1,77,768) +Add_562:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1426(1,77,768)*output:onnx_3A__3A_Mul_5F_1427(1,77,768) +Mul_564:Mul*input:onnx_3A__3A_Mul_5F_1427(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_27(1,77,768) +MatMul_565:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2634.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1431(1,77,768) +Add_566:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1431(1,77,768)*output:onnx_3A__3A_Reshape_5F_1432(1,77,768) +Reshape_567:Reshape*input:onnx_3A__3A_Reshape_5F_1432(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*allowzero:0 +Transpose_568:Transpose*input:onnx_3A__3A_Transpose_5F_1445(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1446(1,12,77,64)*perm:0,2,1,3 +MatMul_569:MatMul*input:onnx_3A__3A_MatMul_5F_1421(1,77,768);onnx_3A__3A_MatMul_5F_2640.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1448(1,77,768) +Add_570:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1448(1,77,768)*output:onnx_3A__3A_Reshape_5F_1449(1,77,768) +Reshape_571:Reshape*input:onnx_3A__3A_Reshape_5F_1449(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*allowzero:0 +Transpose_572:Transpose*input:onnx_3A__3A_Transpose_5F_1462(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1463(1,12,77,64)*perm:0,2,1,3 +Reshape_573:Reshape*input:query_5F_states_2E_27(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*allowzero:0 +Transpose_574:Transpose*input:onnx_3A__3A_Transpose_5F_1476(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1477(1,12,77,64)*perm:0,2,1,3 +Reshape_575:Reshape*input:onnx_3A__3A_Reshape_5F_1477(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1487(12,77,64)*allowzero:0 +Reshape_576:Reshape*input:onnx_3A__3A_Reshape_5F_1446(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1497(12,77,64)*allowzero:0 +Reshape_577:Reshape*input:onnx_3A__3A_Reshape_5F_1463(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1507(12,77,64)*allowzero:0 +Transpose_578:Transpose*input:onnx_3A__3A_Transpose_5F_1497(12,77,64)*output:onnx_3A__3A_MatMul_5F_1509(12,64,77)*perm:0,2,1 +MatMul_579:MatMul*input:onnx_3A__3A_MatMul_5F_1487(12,77,64);onnx_3A__3A_MatMul_5F_1509(12,64,77)*output:onnx_3A__3A_Reshape_5F_1510(12,77,77) +Reshape_580:Reshape*input:onnx_3A__3A_Reshape_5F_1510(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1521(1,12,77,77)*allowzero:0 +Add_581:Add*input:onnx_3A__3A_Add_5F_1521(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1522(1,12,77,77) +Reshape_582:Reshape*input:onnx_3A__3A_Reshape_5F_1522(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_55(12,77,77)*allowzero:0 +Softmax_583:Softmax*input:attn_5F_weights_2E_55(12,77,77)*output:attn_5F_weights_2E_59(12,77,77)*axis:-1 +MatMul_584:MatMul*input:attn_5F_weights_2E_59(12,77,77);onnx_3A__3A_MatMul_5F_1507(12,77,64)*output:onnx_3A__3A_Reshape_5F_1533(12,77,64) +Reshape_585:Reshape*input:onnx_3A__3A_Reshape_5F_1533(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*allowzero:0 +Transpose_586:Transpose*input:onnx_3A__3A_Transpose_5F_1545(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1546(1,77,12,64)*perm:0,2,1,3 +Reshape_587:Reshape*input:onnx_3A__3A_Reshape_5F_1546(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1554(1,77,768)*allowzero:0 +MatMul_588:MatMul*input:onnx_3A__3A_MatMul_5F_1554(1,77,768);onnx_3A__3A_MatMul_5F_2681.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1556(1,77,768) +Add_589:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1556(1,77,768)*output:onnx_3A__3A_Add_5F_1557(1,77,768) +Add_590:Add*input:input_2E_63(1,77,768);onnx_3A__3A_Add_5F_1557(1,77,768)*output:input_2E_67(1,77,768) +ReduceMean_591:ReduceMean*input:input_2E_67(1,77,768)*output:onnx_3A__3A_Sub_5F_1559(1,77,1)*axes:-1 +Sub_592:Sub*input:input_2E_67(1,77,768);onnx_3A__3A_Sub_5F_1559(1,77,1)*output:onnx_3A__3A_Pow_5F_1560(1,77,768) +Pow_594:Pow*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1562(1,77,768) +ReduceMean_595:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1562(1,77,768)*output:onnx_3A__3A_Add_5F_1563(1,77,1)*axes:-1 +Add_597:Add*input:onnx_3A__3A_Add_5F_1563(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1565(1,77,1) +Sqrt_598:Sqrt*input:onnx_3A__3A_Sqrt_5F_1565(1,77,1)*output:onnx_3A__3A_Div_5F_1566(1,77,1) +Div_599:Div*input:onnx_3A__3A_Pow_5F_1560(1,77,768);onnx_3A__3A_Div_5F_1566(1,77,1)*output:onnx_3A__3A_Mul_5F_1567(1,77,768) +Mul_600:Mul*input:onnx_3A__3A_Mul_5F_1567(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1568(1,77,768) +Add_601:Add*input:onnx_3A__3A_Add_5F_1568(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_7_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1569(1,77,768) +MatMul_602:MatMul*input:onnx_3A__3A_MatMul_5F_1569(1,77,768);onnx_3A__3A_MatMul_5F_2682.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1571(1,77,3072) +Add_603:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1571(1,77,3072)*output:onnx_3A__3A_Mul_5F_1572(1,77,3072) +Mul_605:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072) +Sigmoid_606:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1574(1,77,3072)*output:onnx_3A__3A_Mul_5F_1575(1,77,3072) +Mul_607:Mul*input:onnx_3A__3A_Mul_5F_1572(1,77,3072);onnx_3A__3A_Mul_5F_1575(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1576(1,77,3072) +MatMul_608:MatMul*input:onnx_3A__3A_MatMul_5F_1576(1,77,3072);onnx_3A__3A_MatMul_5F_2683.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1578(1,77,768) +Add_609:Add*input:text_5F_model_2E_encoder_2E_layers_2E_7_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1578(1,77,768)*output:onnx_3A__3A_Add_5F_1579(1,77,768) +Add_610:Add*input:input_2E_67(1,77,768);onnx_3A__3A_Add_5F_1579(1,77,768)*output:input_2E_71(1,77,768) +ReduceMean_611:ReduceMean*input:input_2E_71(1,77,768)*output:onnx_3A__3A_Sub_5F_1581(1,77,1)*axes:-1 +Sub_612:Sub*input:input_2E_71(1,77,768);onnx_3A__3A_Sub_5F_1581(1,77,1)*output:onnx_3A__3A_Pow_5F_1582(1,77,768) +Pow_614:Pow*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1584(1,77,768) +ReduceMean_615:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1584(1,77,768)*output:onnx_3A__3A_Add_5F_1585(1,77,1)*axes:-1 +Add_617:Add*input:onnx_3A__3A_Add_5F_1585(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1587(1,77,1) +Sqrt_618:Sqrt*input:onnx_3A__3A_Sqrt_5F_1587(1,77,1)*output:onnx_3A__3A_Div_5F_1588(1,77,1) +Div_619:Div*input:onnx_3A__3A_Pow_5F_1582(1,77,768);onnx_3A__3A_Div_5F_1588(1,77,1)*output:onnx_3A__3A_Mul_5F_1589(1,77,768) +Mul_620:Mul*input:onnx_3A__3A_Mul_5F_1589(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1590(1,77,768) +Add_621:Add*input:onnx_3A__3A_Add_5F_1590(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1591(1,77,768) +MatMul_622:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2684.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1596(1,77,768) +Add_623:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1596(1,77,768)*output:onnx_3A__3A_Mul_5F_1597(1,77,768) +Mul_625:Mul*input:onnx_3A__3A_Mul_5F_1597(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_31(1,77,768) +MatMul_626:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2685.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1601(1,77,768) +Add_627:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1601(1,77,768)*output:onnx_3A__3A_Reshape_5F_1602(1,77,768) +Reshape_628:Reshape*input:onnx_3A__3A_Reshape_5F_1602(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*allowzero:0 +Transpose_629:Transpose*input:onnx_3A__3A_Transpose_5F_1615(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1616(1,12,77,64)*perm:0,2,1,3 +MatMul_630:MatMul*input:onnx_3A__3A_MatMul_5F_1591(1,77,768);onnx_3A__3A_MatMul_5F_2691.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1618(1,77,768) +Add_631:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1618(1,77,768)*output:onnx_3A__3A_Reshape_5F_1619(1,77,768) +Reshape_632:Reshape*input:onnx_3A__3A_Reshape_5F_1619(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*allowzero:0 +Transpose_633:Transpose*input:onnx_3A__3A_Transpose_5F_1632(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1633(1,12,77,64)*perm:0,2,1,3 +Reshape_634:Reshape*input:query_5F_states_2E_31(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*allowzero:0 +Transpose_635:Transpose*input:onnx_3A__3A_Transpose_5F_1646(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1647(1,12,77,64)*perm:0,2,1,3 +Reshape_636:Reshape*input:onnx_3A__3A_Reshape_5F_1647(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1657(12,77,64)*allowzero:0 +Reshape_637:Reshape*input:onnx_3A__3A_Reshape_5F_1616(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1667(12,77,64)*allowzero:0 +Reshape_638:Reshape*input:onnx_3A__3A_Reshape_5F_1633(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1677(12,77,64)*allowzero:0 +Transpose_639:Transpose*input:onnx_3A__3A_Transpose_5F_1667(12,77,64)*output:onnx_3A__3A_MatMul_5F_1679(12,64,77)*perm:0,2,1 +MatMul_640:MatMul*input:onnx_3A__3A_MatMul_5F_1657(12,77,64);onnx_3A__3A_MatMul_5F_1679(12,64,77)*output:onnx_3A__3A_Reshape_5F_1680(12,77,77) +Reshape_641:Reshape*input:onnx_3A__3A_Reshape_5F_1680(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1691(1,12,77,77)*allowzero:0 +Add_642:Add*input:onnx_3A__3A_Add_5F_1691(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1692(1,12,77,77) +Reshape_643:Reshape*input:onnx_3A__3A_Reshape_5F_1692(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_63(12,77,77)*allowzero:0 +Softmax_644:Softmax*input:attn_5F_weights_2E_63(12,77,77)*output:attn_5F_weights_2E_67(12,77,77)*axis:-1 +MatMul_645:MatMul*input:attn_5F_weights_2E_67(12,77,77);onnx_3A__3A_MatMul_5F_1677(12,77,64)*output:onnx_3A__3A_Reshape_5F_1703(12,77,64) +Reshape_646:Reshape*input:onnx_3A__3A_Reshape_5F_1703(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*allowzero:0 +Transpose_647:Transpose*input:onnx_3A__3A_Transpose_5F_1715(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1716(1,77,12,64)*perm:0,2,1,3 +Reshape_648:Reshape*input:onnx_3A__3A_Reshape_5F_1716(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1724(1,77,768)*allowzero:0 +MatMul_649:MatMul*input:onnx_3A__3A_MatMul_5F_1724(1,77,768);onnx_3A__3A_MatMul_5F_2732.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1726(1,77,768) +Add_650:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1726(1,77,768)*output:onnx_3A__3A_Add_5F_1727(1,77,768) +Add_651:Add*input:input_2E_71(1,77,768);onnx_3A__3A_Add_5F_1727(1,77,768)*output:input_2E_75(1,77,768) +ReduceMean_652:ReduceMean*input:input_2E_75(1,77,768)*output:onnx_3A__3A_Sub_5F_1729(1,77,1)*axes:-1 +Sub_653:Sub*input:input_2E_75(1,77,768);onnx_3A__3A_Sub_5F_1729(1,77,1)*output:onnx_3A__3A_Pow_5F_1730(1,77,768) +Pow_655:Pow*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1732(1,77,768) +ReduceMean_656:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1732(1,77,768)*output:onnx_3A__3A_Add_5F_1733(1,77,1)*axes:-1 +Add_658:Add*input:onnx_3A__3A_Add_5F_1733(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1735(1,77,1) +Sqrt_659:Sqrt*input:onnx_3A__3A_Sqrt_5F_1735(1,77,1)*output:onnx_3A__3A_Div_5F_1736(1,77,1) +Div_660:Div*input:onnx_3A__3A_Pow_5F_1730(1,77,768);onnx_3A__3A_Div_5F_1736(1,77,1)*output:onnx_3A__3A_Mul_5F_1737(1,77,768) +Mul_661:Mul*input:onnx_3A__3A_Mul_5F_1737(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1738(1,77,768) +Add_662:Add*input:onnx_3A__3A_Add_5F_1738(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_8_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1739(1,77,768) +MatMul_663:MatMul*input:onnx_3A__3A_MatMul_5F_1739(1,77,768);onnx_3A__3A_MatMul_5F_2733.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1741(1,77,3072) +Add_664:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1741(1,77,3072)*output:onnx_3A__3A_Mul_5F_1742(1,77,3072) +Mul_666:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072) +Sigmoid_667:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1744(1,77,3072)*output:onnx_3A__3A_Mul_5F_1745(1,77,3072) +Mul_668:Mul*input:onnx_3A__3A_Mul_5F_1742(1,77,3072);onnx_3A__3A_Mul_5F_1745(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1746(1,77,3072) +MatMul_669:MatMul*input:onnx_3A__3A_MatMul_5F_1746(1,77,3072);onnx_3A__3A_MatMul_5F_2734.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1748(1,77,768) +Add_670:Add*input:text_5F_model_2E_encoder_2E_layers_2E_8_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1748(1,77,768)*output:onnx_3A__3A_Add_5F_1749(1,77,768) +Add_671:Add*input:input_2E_75(1,77,768);onnx_3A__3A_Add_5F_1749(1,77,768)*output:input_2E_79(1,77,768) +ReduceMean_672:ReduceMean*input:input_2E_79(1,77,768)*output:onnx_3A__3A_Sub_5F_1751(1,77,1)*axes:-1 +Sub_673:Sub*input:input_2E_79(1,77,768);onnx_3A__3A_Sub_5F_1751(1,77,1)*output:onnx_3A__3A_Pow_5F_1752(1,77,768) +Pow_675:Pow*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1754(1,77,768) +ReduceMean_676:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1754(1,77,768)*output:onnx_3A__3A_Add_5F_1755(1,77,1)*axes:-1 +Add_678:Add*input:onnx_3A__3A_Add_5F_1755(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1757(1,77,1) +Sqrt_679:Sqrt*input:onnx_3A__3A_Sqrt_5F_1757(1,77,1)*output:onnx_3A__3A_Div_5F_1758(1,77,1) +Div_680:Div*input:onnx_3A__3A_Pow_5F_1752(1,77,768);onnx_3A__3A_Div_5F_1758(1,77,1)*output:onnx_3A__3A_Mul_5F_1759(1,77,768) +Mul_681:Mul*input:onnx_3A__3A_Mul_5F_1759(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1760(1,77,768) +Add_682:Add*input:onnx_3A__3A_Add_5F_1760(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1761(1,77,768) +MatMul_683:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2735.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1766(1,77,768) +Add_684:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1766(1,77,768)*output:onnx_3A__3A_Mul_5F_1767(1,77,768) +Mul_686:Mul*input:onnx_3A__3A_Mul_5F_1767(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_35(1,77,768) +MatMul_687:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2736.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1771(1,77,768) +Add_688:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1771(1,77,768)*output:onnx_3A__3A_Reshape_5F_1772(1,77,768) +Reshape_689:Reshape*input:onnx_3A__3A_Reshape_5F_1772(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*allowzero:0 +Transpose_690:Transpose*input:onnx_3A__3A_Transpose_5F_1785(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1786(1,12,77,64)*perm:0,2,1,3 +MatMul_691:MatMul*input:onnx_3A__3A_MatMul_5F_1761(1,77,768);onnx_3A__3A_MatMul_5F_2742.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1788(1,77,768) +Add_692:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1788(1,77,768)*output:onnx_3A__3A_Reshape_5F_1789(1,77,768) +Reshape_693:Reshape*input:onnx_3A__3A_Reshape_5F_1789(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*allowzero:0 +Transpose_694:Transpose*input:onnx_3A__3A_Transpose_5F_1802(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1803(1,12,77,64)*perm:0,2,1,3 +Reshape_695:Reshape*input:query_5F_states_2E_35(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*allowzero:0 +Transpose_696:Transpose*input:onnx_3A__3A_Transpose_5F_1816(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1817(1,12,77,64)*perm:0,2,1,3 +Reshape_697:Reshape*input:onnx_3A__3A_Reshape_5F_1817(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1827(12,77,64)*allowzero:0 +Reshape_698:Reshape*input:onnx_3A__3A_Reshape_5F_1786(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_1837(12,77,64)*allowzero:0 +Reshape_699:Reshape*input:onnx_3A__3A_Reshape_5F_1803(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1847(12,77,64)*allowzero:0 +Transpose_700:Transpose*input:onnx_3A__3A_Transpose_5F_1837(12,77,64)*output:onnx_3A__3A_MatMul_5F_1849(12,64,77)*perm:0,2,1 +MatMul_701:MatMul*input:onnx_3A__3A_MatMul_5F_1827(12,77,64);onnx_3A__3A_MatMul_5F_1849(12,64,77)*output:onnx_3A__3A_Reshape_5F_1850(12,77,77) +Reshape_702:Reshape*input:onnx_3A__3A_Reshape_5F_1850(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_1861(1,12,77,77)*allowzero:0 +Add_703:Add*input:onnx_3A__3A_Add_5F_1861(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_1862(1,12,77,77) +Reshape_704:Reshape*input:onnx_3A__3A_Reshape_5F_1862(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_71(12,77,77)*allowzero:0 +Softmax_705:Softmax*input:attn_5F_weights_2E_71(12,77,77)*output:attn_5F_weights_2E_75(12,77,77)*axis:-1 +MatMul_706:MatMul*input:attn_5F_weights_2E_75(12,77,77);onnx_3A__3A_MatMul_5F_1847(12,77,64)*output:onnx_3A__3A_Reshape_5F_1873(12,77,64) +Reshape_707:Reshape*input:onnx_3A__3A_Reshape_5F_1873(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*allowzero:0 +Transpose_708:Transpose*input:onnx_3A__3A_Transpose_5F_1885(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_1886(1,77,12,64)*perm:0,2,1,3 +Reshape_709:Reshape*input:onnx_3A__3A_Reshape_5F_1886(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1894(1,77,768)*allowzero:0 +MatMul_710:MatMul*input:onnx_3A__3A_MatMul_5F_1894(1,77,768);onnx_3A__3A_MatMul_5F_2783.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1896(1,77,768) +Add_711:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1896(1,77,768)*output:onnx_3A__3A_Add_5F_1897(1,77,768) +Add_712:Add*input:input_2E_79(1,77,768);onnx_3A__3A_Add_5F_1897(1,77,768)*output:input_2E_83(1,77,768) +ReduceMean_713:ReduceMean*input:input_2E_83(1,77,768)*output:onnx_3A__3A_Sub_5F_1899(1,77,1)*axes:-1 +Sub_714:Sub*input:input_2E_83(1,77,768);onnx_3A__3A_Sub_5F_1899(1,77,1)*output:onnx_3A__3A_Pow_5F_1900(1,77,768) +Pow_716:Pow*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1902(1,77,768) +ReduceMean_717:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1902(1,77,768)*output:onnx_3A__3A_Add_5F_1903(1,77,1)*axes:-1 +Add_719:Add*input:onnx_3A__3A_Add_5F_1903(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1905(1,77,1) +Sqrt_720:Sqrt*input:onnx_3A__3A_Sqrt_5F_1905(1,77,1)*output:onnx_3A__3A_Div_5F_1906(1,77,1) +Div_721:Div*input:onnx_3A__3A_Pow_5F_1900(1,77,768);onnx_3A__3A_Div_5F_1906(1,77,1)*output:onnx_3A__3A_Mul_5F_1907(1,77,768) +Mul_722:Mul*input:onnx_3A__3A_Mul_5F_1907(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1908(1,77,768) +Add_723:Add*input:onnx_3A__3A_Add_5F_1908(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_9_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1909(1,77,768) +MatMul_724:MatMul*input:onnx_3A__3A_MatMul_5F_1909(1,77,768);onnx_3A__3A_MatMul_5F_2784.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_1911(1,77,3072) +Add_725:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_1911(1,77,3072)*output:onnx_3A__3A_Mul_5F_1912(1,77,3072) +Mul_727:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072) +Sigmoid_728:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_1914(1,77,3072)*output:onnx_3A__3A_Mul_5F_1915(1,77,3072) +Mul_729:Mul*input:onnx_3A__3A_Mul_5F_1912(1,77,3072);onnx_3A__3A_Mul_5F_1915(1,77,3072)*output:onnx_3A__3A_MatMul_5F_1916(1,77,3072) +MatMul_730:MatMul*input:onnx_3A__3A_MatMul_5F_1916(1,77,3072);onnx_3A__3A_MatMul_5F_2785.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_1918(1,77,768) +Add_731:Add*input:text_5F_model_2E_encoder_2E_layers_2E_9_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1918(1,77,768)*output:onnx_3A__3A_Add_5F_1919(1,77,768) +Add_732:Add*input:input_2E_83(1,77,768);onnx_3A__3A_Add_5F_1919(1,77,768)*output:input_2E_87(1,77,768) +ReduceMean_733:ReduceMean*input:input_2E_87(1,77,768)*output:onnx_3A__3A_Sub_5F_1921(1,77,1)*axes:-1 +Sub_734:Sub*input:input_2E_87(1,77,768);onnx_3A__3A_Sub_5F_1921(1,77,1)*output:onnx_3A__3A_Pow_5F_1922(1,77,768) +Pow_736:Pow*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_1924(1,77,768) +ReduceMean_737:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_1924(1,77,768)*output:onnx_3A__3A_Add_5F_1925(1,77,1)*axes:-1 +Add_739:Add*input:onnx_3A__3A_Add_5F_1925(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_1927(1,77,1) +Sqrt_740:Sqrt*input:onnx_3A__3A_Sqrt_5F_1927(1,77,1)*output:onnx_3A__3A_Div_5F_1928(1,77,1) +Div_741:Div*input:onnx_3A__3A_Pow_5F_1922(1,77,768);onnx_3A__3A_Div_5F_1928(1,77,1)*output:onnx_3A__3A_Mul_5F_1929(1,77,768) +Mul_742:Mul*input:onnx_3A__3A_Mul_5F_1929(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_1930(1,77,768) +Add_743:Add*input:onnx_3A__3A_Add_5F_1930(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_1931(1,77,768) +MatMul_744:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2786.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1936(1,77,768) +Add_745:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1936(1,77,768)*output:onnx_3A__3A_Mul_5F_1937(1,77,768) +Mul_747:Mul*input:onnx_3A__3A_Mul_5F_1937(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_39(1,77,768) +MatMul_748:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2787.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1941(1,77,768) +Add_749:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1941(1,77,768)*output:onnx_3A__3A_Reshape_5F_1942(1,77,768) +Reshape_750:Reshape*input:onnx_3A__3A_Reshape_5F_1942(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*allowzero:0 +Transpose_751:Transpose*input:onnx_3A__3A_Transpose_5F_1955(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1956(1,12,77,64)*perm:0,2,1,3 +MatMul_752:MatMul*input:onnx_3A__3A_MatMul_5F_1931(1,77,768);onnx_3A__3A_MatMul_5F_2793.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_1958(1,77,768) +Add_753:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_1958(1,77,768)*output:onnx_3A__3A_Reshape_5F_1959(1,77,768) +Reshape_754:Reshape*input:onnx_3A__3A_Reshape_5F_1959(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*allowzero:0 +Transpose_755:Transpose*input:onnx_3A__3A_Transpose_5F_1972(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1973(1,12,77,64)*perm:0,2,1,3 +Reshape_756:Reshape*input:query_5F_states_2E_39(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*allowzero:0 +Transpose_757:Transpose*input:onnx_3A__3A_Transpose_5F_1986(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_1987(1,12,77,64)*perm:0,2,1,3 +Reshape_758:Reshape*input:onnx_3A__3A_Reshape_5F_1987(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_1997(12,77,64)*allowzero:0 +Reshape_759:Reshape*input:onnx_3A__3A_Reshape_5F_1956(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2007(12,77,64)*allowzero:0 +Reshape_760:Reshape*input:onnx_3A__3A_Reshape_5F_1973(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2017(12,77,64)*allowzero:0 +Transpose_761:Transpose*input:onnx_3A__3A_Transpose_5F_2007(12,77,64)*output:onnx_3A__3A_MatMul_5F_2019(12,64,77)*perm:0,2,1 +MatMul_762:MatMul*input:onnx_3A__3A_MatMul_5F_1997(12,77,64);onnx_3A__3A_MatMul_5F_2019(12,64,77)*output:onnx_3A__3A_Reshape_5F_2020(12,77,77) +Reshape_763:Reshape*input:onnx_3A__3A_Reshape_5F_2020(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2031(1,12,77,77)*allowzero:0 +Add_764:Add*input:onnx_3A__3A_Add_5F_2031(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2032(1,12,77,77) +Reshape_765:Reshape*input:onnx_3A__3A_Reshape_5F_2032(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_79(12,77,77)*allowzero:0 +Softmax_766:Softmax*input:attn_5F_weights_2E_79(12,77,77)*output:attn_5F_weights_2E_83(12,77,77)*axis:-1 +MatMul_767:MatMul*input:attn_5F_weights_2E_83(12,77,77);onnx_3A__3A_MatMul_5F_2017(12,77,64)*output:onnx_3A__3A_Reshape_5F_2043(12,77,64) +Reshape_768:Reshape*input:onnx_3A__3A_Reshape_5F_2043(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*allowzero:0 +Transpose_769:Transpose*input:onnx_3A__3A_Transpose_5F_2055(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2056(1,77,12,64)*perm:0,2,1,3 +Reshape_770:Reshape*input:onnx_3A__3A_Reshape_5F_2056(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2064(1,77,768)*allowzero:0 +MatMul_771:MatMul*input:onnx_3A__3A_MatMul_5F_2064(1,77,768);onnx_3A__3A_MatMul_5F_2834.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2066(1,77,768) +Add_772:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2066(1,77,768)*output:onnx_3A__3A_Add_5F_2067(1,77,768) +Add_773:Add*input:input_2E_87(1,77,768);onnx_3A__3A_Add_5F_2067(1,77,768)*output:input_2E_91(1,77,768) +ReduceMean_774:ReduceMean*input:input_2E_91(1,77,768)*output:onnx_3A__3A_Sub_5F_2069(1,77,1)*axes:-1 +Sub_775:Sub*input:input_2E_91(1,77,768);onnx_3A__3A_Sub_5F_2069(1,77,1)*output:onnx_3A__3A_Pow_5F_2070(1,77,768) +Pow_777:Pow*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2072(1,77,768) +ReduceMean_778:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2072(1,77,768)*output:onnx_3A__3A_Add_5F_2073(1,77,1)*axes:-1 +Add_780:Add*input:onnx_3A__3A_Add_5F_2073(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2075(1,77,1) +Sqrt_781:Sqrt*input:onnx_3A__3A_Sqrt_5F_2075(1,77,1)*output:onnx_3A__3A_Div_5F_2076(1,77,1) +Div_782:Div*input:onnx_3A__3A_Pow_5F_2070(1,77,768);onnx_3A__3A_Div_5F_2076(1,77,1)*output:onnx_3A__3A_Mul_5F_2077(1,77,768) +Mul_783:Mul*input:onnx_3A__3A_Mul_5F_2077(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2078(1,77,768) +Add_784:Add*input:onnx_3A__3A_Add_5F_2078(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_10_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2079(1,77,768) +MatMul_785:MatMul*input:onnx_3A__3A_MatMul_5F_2079(1,77,768);onnx_3A__3A_MatMul_5F_2835.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2081(1,77,3072) +Add_786:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2081(1,77,3072)*output:onnx_3A__3A_Mul_5F_2082(1,77,3072) +Mul_788:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072) +Sigmoid_789:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2084(1,77,3072)*output:onnx_3A__3A_Mul_5F_2085(1,77,3072) +Mul_790:Mul*input:onnx_3A__3A_Mul_5F_2082(1,77,3072);onnx_3A__3A_Mul_5F_2085(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2086(1,77,3072) +MatMul_791:MatMul*input:onnx_3A__3A_MatMul_5F_2086(1,77,3072);onnx_3A__3A_MatMul_5F_2836.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2088(1,77,768) +Add_792:Add*input:text_5F_model_2E_encoder_2E_layers_2E_10_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2088(1,77,768)*output:onnx_3A__3A_Add_5F_2089(1,77,768) +Add_793:Add*input:input_2E_91(1,77,768);onnx_3A__3A_Add_5F_2089(1,77,768)*output:input_2E_95(1,77,768) +ReduceMean_794:ReduceMean*input:input_2E_95(1,77,768)*output:onnx_3A__3A_Sub_5F_2091(1,77,1)*axes:-1 +Sub_795:Sub*input:input_2E_95(1,77,768);onnx_3A__3A_Sub_5F_2091(1,77,1)*output:onnx_3A__3A_Pow_5F_2092(1,77,768) +Pow_797:Pow*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2094(1,77,768) +ReduceMean_798:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2094(1,77,768)*output:onnx_3A__3A_Add_5F_2095(1,77,1)*axes:-1 +Add_800:Add*input:onnx_3A__3A_Add_5F_2095(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2097(1,77,1) +Sqrt_801:Sqrt*input:onnx_3A__3A_Sqrt_5F_2097(1,77,1)*output:onnx_3A__3A_Div_5F_2098(1,77,1) +Div_802:Div*input:onnx_3A__3A_Pow_5F_2092(1,77,768);onnx_3A__3A_Div_5F_2098(1,77,1)*output:onnx_3A__3A_Mul_5F_2099(1,77,768) +Mul_803:Mul*input:onnx_3A__3A_Mul_5F_2099(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2100(1,77,768) +Add_804:Add*input:onnx_3A__3A_Add_5F_2100(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm1_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2101(1,77,768) +MatMul_805:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2837.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2106(1,77,768) +Add_806:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_q_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2106(1,77,768)*output:onnx_3A__3A_Mul_5F_2107(1,77,768) +Mul_808:Mul*input:onnx_3A__3A_Mul_5F_2107(1,77,768);onnx_3A__3A_Mul_5F_238.bin(float32:)*output:query_5F_states_2E_43(1,77,768) +MatMul_809:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2838.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2111(1,77,768) +Add_810:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_k_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2111(1,77,768)*output:onnx_3A__3A_Reshape_5F_2112(1,77,768) +Reshape_811:Reshape*input:onnx_3A__3A_Reshape_5F_2112(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*allowzero:0 +Transpose_812:Transpose*input:onnx_3A__3A_Transpose_5F_2125(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2126(1,12,77,64)*perm:0,2,1,3 +MatMul_813:MatMul*input:onnx_3A__3A_MatMul_5F_2101(1,77,768);onnx_3A__3A_MatMul_5F_2844.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2128(1,77,768) +Add_814:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_v_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2128(1,77,768)*output:onnx_3A__3A_Reshape_5F_2129(1,77,768) +Reshape_815:Reshape*input:onnx_3A__3A_Reshape_5F_2129(1,77,768);onnx_3A__3A_Reshape_5F_2282.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*allowzero:0 +Transpose_816:Transpose*input:onnx_3A__3A_Transpose_5F_2142(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2143(1,12,77,64)*perm:0,2,1,3 +Reshape_817:Reshape*input:query_5F_states_2E_43(1,77,768);onnx_3A__3A_Reshape_5F_2293.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*allowzero:0 +Transpose_818:Transpose*input:onnx_3A__3A_Transpose_5F_2156(1,77,12,64)*output:onnx_3A__3A_Reshape_5F_2157(1,12,77,64)*perm:0,2,1,3 +Reshape_819:Reshape*input:onnx_3A__3A_Reshape_5F_2157(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2167(12,77,64)*allowzero:0 +Reshape_820:Reshape*input:onnx_3A__3A_Reshape_5F_2126(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_Transpose_5F_2177(12,77,64)*allowzero:0 +Reshape_821:Reshape*input:onnx_3A__3A_Reshape_5F_2143(1,12,77,64);onnx_3A__3A_Reshape_5F_2297.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2187(12,77,64)*allowzero:0 +Transpose_822:Transpose*input:onnx_3A__3A_Transpose_5F_2177(12,77,64)*output:onnx_3A__3A_MatMul_5F_2189(12,64,77)*perm:0,2,1 +MatMul_823:MatMul*input:onnx_3A__3A_MatMul_5F_2167(12,77,64);onnx_3A__3A_MatMul_5F_2189(12,64,77)*output:onnx_3A__3A_Reshape_5F_2190(12,77,77) +Reshape_824:Reshape*input:onnx_3A__3A_Reshape_5F_2190(12,77,77);onnx_3A__3A_Reshape_5F_2310.bin(int64:4)*output:onnx_3A__3A_Add_5F_2201(1,12,77,77)*allowzero:0 +Add_825:Add*input:onnx_3A__3A_Add_5F_2201(1,12,77,77);onnx_3A__3A_Add_5F_220.bin(float32:1,1,77,77)*output:onnx_3A__3A_Reshape_5F_2202(1,12,77,77) +Reshape_826:Reshape*input:onnx_3A__3A_Reshape_5F_2202(1,12,77,77);onnx_3A__3A_Reshape_5F_2314.bin(int64:3)*output:attn_5F_weights_2E_87(12,77,77)*allowzero:0 +Softmax_827:Softmax*input:attn_5F_weights_2E_87(12,77,77)*output:attn_5F_weights_2E_91(12,77,77)*axis:-1 +MatMul_828:MatMul*input:attn_5F_weights_2E_91(12,77,77);onnx_3A__3A_MatMul_5F_2187(12,77,64)*output:onnx_3A__3A_Reshape_5F_2213(12,77,64) +Reshape_829:Reshape*input:onnx_3A__3A_Reshape_5F_2213(12,77,64);onnx_3A__3A_Reshape_5F_2319.bin(int64:4)*output:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*allowzero:0 +Transpose_830:Transpose*input:onnx_3A__3A_Transpose_5F_2225(1,12,77,64)*output:onnx_3A__3A_Reshape_5F_2226(1,77,12,64)*perm:0,2,1,3 +Reshape_831:Reshape*input:onnx_3A__3A_Reshape_5F_2226(1,77,12,64);onnx_3A__3A_Reshape_5F_2323.bin(int64:3)*output:onnx_3A__3A_MatMul_5F_2234(1,77,768)*allowzero:0 +MatMul_832:MatMul*input:onnx_3A__3A_MatMul_5F_2234(1,77,768);onnx_3A__3A_MatMul_5F_2885.bin(float32:768,768)*output:onnx_3A__3A_Add_5F_2236(1,77,768) +Add_833:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_self_5F_attn_2E_out_5F_proj_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2236(1,77,768)*output:onnx_3A__3A_Add_5F_2237(1,77,768) +Add_834:Add*input:input_2E_95(1,77,768);onnx_3A__3A_Add_5F_2237(1,77,768)*output:input_2E_99(1,77,768) +ReduceMean_835:ReduceMean*input:input_2E_99(1,77,768)*output:onnx_3A__3A_Sub_5F_2239(1,77,1)*axes:-1 +Sub_836:Sub*input:input_2E_99(1,77,768);onnx_3A__3A_Sub_5F_2239(1,77,1)*output:onnx_3A__3A_Pow_5F_2240(1,77,768) +Pow_838:Pow*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2242(1,77,768) +ReduceMean_839:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2242(1,77,768)*output:onnx_3A__3A_Add_5F_2243(1,77,1)*axes:-1 +Add_841:Add*input:onnx_3A__3A_Add_5F_2243(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2245(1,77,1) +Sqrt_842:Sqrt*input:onnx_3A__3A_Sqrt_5F_2245(1,77,1)*output:onnx_3A__3A_Div_5F_2246(1,77,1) +Div_843:Div*input:onnx_3A__3A_Pow_5F_2240(1,77,768);onnx_3A__3A_Div_5F_2246(1,77,1)*output:onnx_3A__3A_Mul_5F_2247(1,77,768) +Mul_844:Mul*input:onnx_3A__3A_Mul_5F_2247(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2248(1,77,768) +Add_845:Add*input:onnx_3A__3A_Add_5F_2248(1,77,768);text_5F_model_2E_encoder_2E_layers_2E_11_2E_layer_5F_norm2_2E_bias.bin(float32:768)*output:onnx_3A__3A_MatMul_5F_2249(1,77,768) +MatMul_846:MatMul*input:onnx_3A__3A_MatMul_5F_2249(1,77,768);onnx_3A__3A_MatMul_5F_2886.bin(float32:768,3072)*output:onnx_3A__3A_Add_5F_2251(1,77,3072) +Add_847:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc1_2E_bias.bin(float32:3072);onnx_3A__3A_Add_5F_2251(1,77,3072)*output:onnx_3A__3A_Mul_5F_2252(1,77,3072) +Mul_849:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_383.bin(float32:)*output:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072) +Sigmoid_850:Sigmoid*input:onnx_3A__3A_Sigmoid_5F_2254(1,77,3072)*output:onnx_3A__3A_Mul_5F_2255(1,77,3072) +Mul_851:Mul*input:onnx_3A__3A_Mul_5F_2252(1,77,3072);onnx_3A__3A_Mul_5F_2255(1,77,3072)*output:onnx_3A__3A_MatMul_5F_2256(1,77,3072) +MatMul_852:MatMul*input:onnx_3A__3A_MatMul_5F_2256(1,77,3072);onnx_3A__3A_MatMul_5F_2887.bin(float32:3072,768)*output:onnx_3A__3A_Add_5F_2258(1,77,768) +Add_853:Add*input:text_5F_model_2E_encoder_2E_layers_2E_11_2E_mlp_2E_fc2_2E_bias.bin(float32:768);onnx_3A__3A_Add_5F_2258(1,77,768)*output:onnx_3A__3A_Add_5F_2259(1,77,768) +Add_854:Add*input:input_2E_99(1,77,768);onnx_3A__3A_Add_5F_2259(1,77,768)*output:input_2E_103(1,77,768) +ReduceMean_855:ReduceMean*input:input_2E_103(1,77,768)*output:onnx_3A__3A_Sub_5F_2261(1,77,1)*axes:-1 +Sub_856:Sub*input:input_2E_103(1,77,768);onnx_3A__3A_Sub_5F_2261(1,77,1)*output:onnx_3A__3A_Pow_5F_2262(1,77,768) +Pow_858:Pow*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Pow_5F_223.bin(float32:)*output:onnx_3A__3A_ReduceMean_5F_2264(1,77,768) +ReduceMean_859:ReduceMean*input:onnx_3A__3A_ReduceMean_5F_2264(1,77,768)*output:onnx_3A__3A_Add_5F_2265(1,77,1)*axes:-1 +Add_861:Add*input:onnx_3A__3A_Add_5F_2265(1,77,1);onnx_3A__3A_Add_5F_226.bin(float32:)*output:onnx_3A__3A_Sqrt_5F_2267(1,77,1) +Sqrt_862:Sqrt*input:onnx_3A__3A_Sqrt_5F_2267(1,77,1)*output:onnx_3A__3A_Div_5F_2268(1,77,1) +Div_863:Div*input:onnx_3A__3A_Pow_5F_2262(1,77,768);onnx_3A__3A_Div_5F_2268(1,77,1)*output:onnx_3A__3A_Mul_5F_2269(1,77,768) +Mul_864:Mul*input:onnx_3A__3A_Mul_5F_2269(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_weight.bin(float32:768)*output:onnx_3A__3A_Add_5F_2270(1,77,768) +Add_865:Add*input:onnx_3A__3A_Add_5F_2270(1,77,768);text_5F_model_2E_final_5F_layer_5F_norm_2E_bias.bin(float32:768)*output:2271(1,77,768)