diff --git "a/coreml/feature-extraction/float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" "b/coreml/feature-extraction/float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" new file mode 100644--- /dev/null +++ "b/coreml/feature-extraction/float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" @@ -0,0 +1,17413 @@ +� +L + input_ids2Indices of input sequence tokens in the vocabulary * +��� +w +attention_maskXMask to avoid performing attention on padding token indices (1 = not masked, 0 = masked) * +��� +[ +decoder_input_ids:Indices of decoder input sequence tokens in the vocabulary +* +{�� +~ +decoder_attention_maskXMask to avoid performing attention on padding token indices (1 = not masked, 0 = masked) +* +{��Rc +last_hidden_stateFSequence of hidden-states at the output of the last layer of the model*���� +t5-small (feature-extraction)�3 +#com.github.apple.coremltools.source torch==2.0.1�- +$com.github.apple.coremltools.version7.0b1�) +co.huggingface.exporters.namet5-small�3 +co.huggingface.exporters.taskfeature-extraction�C +%co.huggingface.exporters.architectureT5ForConditionalGeneration�- +"co.huggingface.exporters.frameworkpytorch�- +"co.huggingface.exporters.precisionfloat32��� +�� + +main�� + + + input_ids + + +� +% +attention_mask + + +� +' +decoder_input_ids + + +{ +, +decoder_attention_mask + + +{CoreML5�� + +CoreML5�� +last_hidden_state� +const, +model_shared_weight +  +�� +�*) +name! + +" +model_shared_weight*B +val; +  +�� +�*" +@model_path/weights/weight.bin@� +const@ +/model_encoder_block_0_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_0_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���� +constL +4model_encoder_block_0_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_0_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���� +constL +4model_encoder_block_0_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_0_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���� +constL +4model_encoder_block_0_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_0_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��� � +constL +4model_encoder_block_0_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_0_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��� � +const@ +/model_encoder_block_0_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_0_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���!� +constN +6model_encoder_block_0_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_0_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���!� +constN +6model_encoder_block_0_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_0_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���#� +const@ +/model_encoder_block_1_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_1_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���%� +constL +4model_encoder_block_1_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_1_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���%� +constL +4model_encoder_block_1_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_1_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���%� +constL +4model_encoder_block_1_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_1_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���&� +constL +4model_encoder_block_1_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_1_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���&� +const@ +/model_encoder_block_1_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_1_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���'� +constN +6model_encoder_block_1_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_1_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�Ȱ'� +constN +6model_encoder_block_1_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_1_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�Ȱ)� +const@ +/model_encoder_block_2_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_2_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�ɰ+� +constL +4model_encoder_block_2_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_2_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ٰ+� +constL +4model_encoder_block_2_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_2_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���+� +constL +4model_encoder_block_2_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_2_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ڰ,� +constL +4model_encoder_block_2_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_2_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���,� +const@ +/model_encoder_block_2_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_2_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�۰-� +constN +6model_encoder_block_2_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_2_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��-� +constN +6model_encoder_block_2_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_2_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��/� +const@ +/model_encoder_block_3_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_3_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���1� +constL +4model_encoder_block_3_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_3_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���1� +constL +4model_encoder_block_3_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_3_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���1� +constL +4model_encoder_block_3_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_3_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���2� +constL +4model_encoder_block_3_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_3_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���2� +const@ +/model_encoder_block_3_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_3_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���3� +constN +6model_encoder_block_3_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_3_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���3� +constN +6model_encoder_block_3_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_3_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���5� +const@ +/model_encoder_block_4_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_4_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���7� +constL +4model_encoder_block_4_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_4_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���7� +constL +4model_encoder_block_4_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_4_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���7� +constL +4model_encoder_block_4_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_4_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���8� +constL +4model_encoder_block_4_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_4_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���8� +const@ +/model_encoder_block_4_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_4_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���9� +constN +6model_encoder_block_4_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_4_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���9� +constN +6model_encoder_block_4_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_4_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���;� +const@ +/model_encoder_block_5_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_5_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���=� +constL +4model_encoder_block_5_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_5_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ű=� +constL +4model_encoder_block_5_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_5_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���=� +constL +4model_encoder_block_5_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_5_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�Ʊ>� +constL +4model_encoder_block_5_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_encoder_block_5_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���>� +const@ +/model_encoder_block_5_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_encoder_block_5_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�DZ?� +constN +6model_encoder_block_5_layer_1_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_5_layer_1_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ر?� +constN +6model_encoder_block_5_layer_1_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_encoder_block_5_layer_1_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�رA� +const6 +%model_encoder_final_layer_norm_weight +   +�*; +name3 ++ +)"' +%model_encoder_final_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�ٱC� +const@ +/model_decoder_block_0_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_0_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin��C� +constL +4model_decoder_block_0_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_0_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���C� +constL +4model_decoder_block_0_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_0_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���C� +constL +4model_decoder_block_0_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_0_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���D� +constL +4model_decoder_block_0_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_0_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���D� +const@ +/model_decoder_block_0_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_0_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���E� +constN +6model_decoder_block_0_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���E� +constN +6model_decoder_block_0_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���E� +constN +6model_decoder_block_0_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���F� +constN +6model_decoder_block_0_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���F� +const@ +/model_decoder_block_0_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_0_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���G� +constN +6model_decoder_block_0_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���G� +constN +6model_decoder_block_0_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_0_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���I� +const@ +/model_decoder_block_1_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_1_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���K� +constL +4model_decoder_block_1_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_1_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���K� +constL +4model_decoder_block_1_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_1_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���K� +constL +4model_decoder_block_1_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_1_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���L� +constL +4model_decoder_block_1_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_1_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���L� +const@ +/model_decoder_block_1_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_1_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���M� +constN +6model_decoder_block_1_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�òM� +constN +6model_decoder_block_1_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���M� +constN +6model_decoder_block_1_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�IJN� +constN +6model_decoder_block_1_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���N� +const@ +/model_decoder_block_1_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_1_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�ŲO� +constN +6model_decoder_block_1_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ղO� +constN +6model_decoder_block_1_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_1_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ֲQ� +const@ +/model_decoder_block_2_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_2_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�ֲS� +constL +4model_decoder_block_2_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_2_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��S� +constL +4model_decoder_block_2_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_2_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���S� +constL +4model_decoder_block_2_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_2_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��T� +constL +4model_decoder_block_2_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_2_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���T� +const@ +/model_decoder_block_2_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_2_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin��U� +constN +6model_decoder_block_2_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���U� +constN +6model_decoder_block_2_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���U� +constN +6model_decoder_block_2_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���V� +constN +6model_decoder_block_2_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���V� +const@ +/model_decoder_block_2_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_2_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���W� +constN +6model_decoder_block_2_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���W� +constN +6model_decoder_block_2_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_2_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���Y� +const@ +/model_decoder_block_3_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_3_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���[� +constL +4model_decoder_block_3_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_3_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���[� +constL +4model_decoder_block_3_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_3_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���[� +constL +4model_decoder_block_3_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_3_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���\� +constL +4model_decoder_block_3_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_3_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���\� +const@ +/model_decoder_block_3_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_3_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���]� +constN +6model_decoder_block_3_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���]� +constN +6model_decoder_block_3_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���]� +constN +6model_decoder_block_3_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���^� +constN +6model_decoder_block_3_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���^� +const@ +/model_decoder_block_3_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_3_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���_� +constN +6model_decoder_block_3_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�³_� +constN +6model_decoder_block_3_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_3_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�óa� +const@ +/model_decoder_block_4_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_4_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�óc� +constL +4model_decoder_block_4_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_4_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�Գc� +constL +4model_decoder_block_4_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_4_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���c� +constL +4model_decoder_block_4_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_4_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ճd� +constL +4model_decoder_block_4_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_4_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���d� +const@ +/model_decoder_block_4_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_4_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin�ֳe� +constN +6model_decoder_block_4_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��e� +constN +6model_decoder_block_4_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���e� +constN +6model_decoder_block_4_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��f� +constN +6model_decoder_block_4_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���f� +const@ +/model_decoder_block_4_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_4_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin��g� +constN +6model_decoder_block_4_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���g� +constN +6model_decoder_block_4_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_4_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���i� +const@ +/model_decoder_block_5_layer_0_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_5_layer_0_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���k� +constL +4model_decoder_block_5_layer_0_SelfAttention_q_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_5_layer_0_SelfAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���k� +constL +4model_decoder_block_5_layer_0_SelfAttention_k_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_5_layer_0_SelfAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���k� +constL +4model_decoder_block_5_layer_0_SelfAttention_v_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_5_layer_0_SelfAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���l� +constL +4model_decoder_block_5_layer_0_SelfAttention_o_weight +  +� +�*J +nameB +: +8"6 +4model_decoder_block_5_layer_0_SelfAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���l� +const@ +/model_decoder_block_5_layer_1_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_5_layer_1_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���m� +constN +6model_decoder_block_5_layer_1_EncDecAttention_q_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_1_EncDecAttention_q_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���m� +constN +6model_decoder_block_5_layer_1_EncDecAttention_k_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_1_EncDecAttention_k_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���m� +constN +6model_decoder_block_5_layer_1_EncDecAttention_v_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_1_EncDecAttention_v_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���n� +constN +6model_decoder_block_5_layer_1_EncDecAttention_o_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_1_EncDecAttention_o_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���n� +const@ +/model_decoder_block_5_layer_2_layer_norm_weight +   +�*E +name= +5 +3"1 +/model_decoder_block_5_layer_2_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���o� +constN +6model_decoder_block_5_layer_2_DenseReluDense_wi_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_2_DenseReluDense_wi_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���o� +constN +6model_decoder_block_5_layer_2_DenseReluDense_wo_weight +  +� +�*L +nameD +< +:"8 +6model_decoder_block_5_layer_2_DenseReluDense_wo_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���q� +const6 +%model_decoder_final_layer_norm_weight +   +�*; +name3 ++ +)"' +%model_decoder_final_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���sS +const +var_9 +* +name + + +" +op_9* +val + + + +���������O +const +var_17 + * +name + + " +op_17* +val +  + + + +�?L +const +var_19 +* +name + + " +op_19* +val + + +] +const +input_3_axis_0 +*$ +name + +" +input_3_axis_0* +val + + +� +gather +x + +model_shared_weight +indices + + input_ids +axis + +input_3_axis_0% +input_3 +  + +� +�* +name + + " +input_3j +const + var_48_axes_0 + + +*" +name + +" + op_48_axes_0* +val + + + + +� + expand_dims +x + +attention_mask +axes + + var_48_axes_0# +var_48 + + + +�* +name + + " +op_48j +const + var_49_axes_0 + + +*" +name + +" + op_49_axes_0* +val + + + + +� + expand_dims +x + + +var_48 +axes + + var_49_axes_0) +var_49 + + + + +�* +name + + " +op_49_ +const +var_51_dtype_0 +*# +name + +" + op_51_dtype_0* +val + + +" +fp32 +cast +x + + +var_49 +dtype + +var_51_dtype_0* +cast_87 +  + + + +�* +name + + " +cast_87p +sub +x + + +var_17 +y + +cast_87) +var_52 +  + + + +�* +name + + " +op_52O +const +var_53 + * +name + + " +op_53* +val +  + + + +���p +mul +x + + +var_52 +y + + +var_53) +mask_1 +  + + + +�* +name + + +" +mask_1a +const +var_13_promoted + *$ +name + +" +op_13_promoted* +val +  + + + +@t +pow +x + +input_3 +y + +var_13_promoted$ +var_64 +  + +� +�* +name + + " +op_64e +const +var_65 + + +* +name + + " +op_65*' +val  + + + + + +���������� + reduce_mean +x + + +var_64 +axes + + +var_65 + keep_dims + + +var_19' + +variance_1 +  + +� +* +name + +" + +variance_1O +const +var_67 + * +name + + " +op_67* +val +  + + + +�7�5m +add +x + + +variance_1 +y + + +var_67# +var_68 +  + +� +* +name + + " +op_68c +const +var_69_epsilon_0 + *% +name + +" +op_69_epsilon_0* +val +  + + + +̼�+{ +rsqrt +x + + +var_68 +epsilon + +var_69_epsilon_0# +var_69 +  + +� +* +name + + " +op_69~ +mul +x + +input_3 +y + + +var_69- +hidden_states_5 +  + +� +�*% +name + +" +hidden_states_5� +mul8 +x3 +1 +/model_encoder_block_0_layer_0_layer_norm_weight +y + +hidden_states_5- +hidden_states_7 +  + +� +�*% +name + +" +hidden_states_7� +const +states_1_bias_0 +   +�*% +name + +" +states_1_bias_0*= +val6 +   +�*% +@model_path/weights/weight.bin���s� +linear +x + +hidden_states_7B +weight8 +6 +4model_encoder_block_0_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& +states_1 +  + +� +�* +name + + " + +states_1h +const +var_84 + + +* +name + + " +op_84** +val# + + + + + ���������@y +reshape +x + + +states_1 +shape + + +var_84) +var_85 +  + +� + +@* +name + + " +op_85� +linear +x + +hidden_states_7B +weight8 +6 +4model_encoder_block_0_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0& +states_3 +  + +� +�* +name + + " + +states_3h +const +var_89 + + +* +name + + " +op_89** +val# + + + + + ���������@y +reshape +x + + +states_3 +shape + + +var_89) +var_90 +  + +� + +@* +name + + " +op_90� +linear +x + +hidden_states_7B +weight8 +6 +4model_encoder_block_0_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0& +states_5 +  + +� +�* +name + + " + +states_5h +const +var_94 + + +* +name + + " +op_94** +val# + + + + + ���������@y +reshape +x + + +states_5 +shape + + +var_94) +var_95 +  + +� + +@* +name + + " +op_95~ +const% +value_states_1_perm_0 + + +*+ +name# + +" +value_states_1_perm_0*! +val + + + + + +m +const +scores_1_transpose_x_0 +*, +name$ + +" +scores_1_transpose_x_0* +val + + +m +const +scores_1_transpose_y_0 +*, +name$ + +" +scores_1_transpose_y_0* +val + + +z +const# +transpose_54_perm_0 + + +*) +name! + +" +transpose_54_perm_0*! +val + + + + + +z +const# +transpose_55_perm_0 + + +*) +name! + +" +transpose_55_perm_0*! +val + + + + + +� + transpose +x + + +var_90 +perm + +transpose_55_perm_00 + transpose_159 +  + + +@ +�*# +name + +" + transpose_159� + transpose +x + + +var_85 +perm + +transpose_54_perm_00 + transpose_160 +  + + +� +@*# +name + +" + transpose_160� +matmul +x + + transpose_160 +y + + transpose_159) + transpose_x + +scores_1_transpose_x_0) + transpose_y + +scores_1_transpose_y_0, +scores_1 +  + + +� +�* +name + + " + +scores_1� +const3 +position_bias_1 +  + + +� +�*% +name + +" +position_bias_1*P +valI +  + + +� +�*% +@model_path/weights/weight.bin�Ѵs� +add +x + +position_bias_1 +y + + +mask_13 +position_bias_3 +  + + +� +�*% +name + +" +position_bias_3� +add +x + + +scores_1 +y + +position_bias_3, +scores_3 +  + + +� +�* +name + + " + +scores_3z +softmax +x + + +scores_3 +axis + +var_9+ +var_137 +  + + +� +�* +name + + +" +op_137h +identity +x + +var_137+ +input_9 +  + + +� +�* +name + + " +input_9m +const +states_7_transpose_x_0 +*, +name$ + +" +states_7_transpose_x_0* +val + + +m +const +states_7_transpose_y_0 +*, +name$ + +" +states_7_transpose_y_0* +val + + +� + transpose +x + + +var_95! +perm + +value_states_1_perm_00 + transpose_161 +  + + +� +@*# +name + +" + transpose_161� +matmul +x + +input_9 +y + + transpose_161) + transpose_x + +states_7_transpose_x_0) + transpose_y + +states_7_transpose_y_0+ +states_7 +  + + +� +@* +name + + " + +states_7o +const +var_141_perm_0 + + +*# +name + +" + op_141_perm_0*! +val + + + + + +j +const +var_143 + + +* +name + + +" +op_143** +val# + + + + + ����������� + transpose +x + + +states_7 +perm + +var_141_perm_00 + transpose_158 +  + +� + +@*# +name + +" + transpose_158 +reshape +x + + transpose_158 +shape + +var_143& +input_11 +  + +� +�* +name + + " + +input_11� +linear +x + + +input_11B +weight8 +6 +4model_encoder_block_0_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& +input_13 +  + +� +�* +name + + " + +input_13� +add +x + +input_3 +y + + +input_13- +hidden_states_9 +  + +� +�*% +name + +" +hidden_states_9e +const +var_13_promoted_1 + *& +name + +" +op_13_promoted_1* +val +  + + + +@� +pow +x + +hidden_states_9 +y + +var_13_promoted_1% +var_159 +  + +� +�* +name + + +" +op_159g +const +var_160 + + +* +name + + +" +op_160*' +val  + + + + + +���������� + reduce_mean +x + +var_159 +axes + +var_160 + keep_dims + + +var_19' + +variance_3 +  + +� +* +name + +" + +variance_3Q +const +var_162 + * +name + + +" +op_162* +val +  + + + +�7�5p +add +x + + +variance_3 +y + +var_162$ +var_163 +  + +� +* +name + + +" +op_163e +const +var_164_epsilon_0 + *& +name + +" +op_164_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_163 +epsilon + +var_164_epsilon_0$ +var_164 +  + +� +* +name + + +" +op_164� +mul +x + +hidden_states_9 +y + +var_164. +hidden_states_13 +  + +� +�*& +name + +" +hidden_states_13� +mul8 +x3 +1 +/model_encoder_block_0_layer_1_layer_norm_weight +y + +hidden_states_13& +input_15 +  + +� +�* +name + + " + +input_15� +const +input_17_bias_0 +   +�*% +name + +" +input_17_bias_0*= +val6 +   +�*% +@model_path/weights/weight.bin���s� +linear +x + + +input_15D +weight: +8 +6model_encoder_block_0_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0& +input_17 +  + +� +�* +name + + " + +input_17a +relu +x + + +input_17& +input_19 +  + +� +�* +name + + " + +input_19� +linear +x + + +input_19D +weight: +8 +6model_encoder_block_0_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0& +input_23 +  + +� +�* +name + + " + +input_23� +add +x + +hidden_states_9 +y + + +input_23. +hidden_states_15 +  + +� +�*& +name + +" +hidden_states_15e +const +var_13_promoted_2 + *& +name + +" +op_13_promoted_2* +val +  + + + +@� +pow +x + +hidden_states_15 +y + +var_13_promoted_2% +var_191 +  + +� +�* +name + + +" +op_191g +const +var_192 + + +* +name + + +" +op_192*' +val  + + + + + +���������� + reduce_mean +x + +var_191 +axes + +var_192 + keep_dims + + +var_19' + +variance_5 +  + +� +* +name + +" + +variance_5Q +const +var_194 + * +name + + +" +op_194* +val +  + + + +�7�5p +add +x + + +variance_5 +y + +var_194$ +var_195 +  + +� +* +name + + +" +op_195e +const +var_196_epsilon_0 + *& +name + +" +op_196_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_195 +epsilon + +var_196_epsilon_0$ +var_196 +  + +� +* +name + + +" +op_196� +mul +x + +hidden_states_15 +y + +var_196. +hidden_states_19 +  + +� +�*& +name + +" +hidden_states_19� +mul8 +x3 +1 +/model_encoder_block_1_layer_0_layer_norm_weight +y + +hidden_states_19. +hidden_states_21 +  + +� +�*& +name + +" +hidden_states_21� +linear +x + +hidden_states_21B +weight8 +6 +4model_encoder_block_1_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& +states_9 +  + +� +�* +name + + " + +states_9j +const +var_209 + + +* +name + + +" +op_209** +val# + + + + + ���������@| +reshape +x + + +states_9 +shape + +var_209* +var_210 +  + +� + +@* +name + + +" +op_210� +linear +x + +hidden_states_21B +weight8 +6 +4model_encoder_block_1_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + states_11 +  + +� +�* +name + + " + states_11j +const +var_214 + + +* +name + + +" +op_214** +val# + + + + + ���������@} +reshape +x + + states_11 +shape + +var_214* +var_215 +  + +� + +@* +name + + +" +op_215� +linear +x + +hidden_states_21B +weight8 +6 +4model_encoder_block_1_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + states_13 +  + +� +�* +name + + " + states_13j +const +var_219 + + +* +name + + +" +op_219** +val# + + + + + ���������@} +reshape +x + + states_13 +shape + +var_219* +var_220 +  + +� + +@* +name + + +" +op_220~ +const% +value_states_3_perm_0 + + +*+ +name# + +" +value_states_3_perm_0*! +val + + + + + +m +const +scores_5_transpose_x_0 +*, +name$ + +" +scores_5_transpose_x_0* +val + + +m +const +scores_5_transpose_y_0 +*, +name$ + +" +scores_5_transpose_y_0* +val + + +z +const# +transpose_56_perm_0 + + +*) +name! + +" +transpose_56_perm_0*! +val + + + + + +z +const# +transpose_57_perm_0 + + +*) +name! + +" +transpose_57_perm_0*! +val + + + + + +� + transpose +x + +var_215 +perm + +transpose_57_perm_00 + transpose_155 +  + + +@ +�*# +name + +" + transpose_155� + transpose +x + +var_210 +perm + +transpose_56_perm_00 + transpose_156 +  + + +� +@*# +name + +" + transpose_156� +matmul +x + + transpose_156 +y + + transpose_155) + transpose_x + +scores_5_transpose_x_0) + transpose_y + +scores_5_transpose_y_0, +scores_5 +  + + +� +�* +name + + " + +scores_5� +add +x + + +scores_5 +y + +position_bias_3, +scores_7 +  + + +� +�* +name + + " + +scores_7z +softmax +x + + +scores_7 +axis + +var_9+ +var_226 +  + + +� +�* +name + + +" +op_226j +identity +x + +var_226, +input_27 +  + + +� +�* +name + + " + +input_27o +const +states_15_transpose_x_0 +*- +name% + +" +states_15_transpose_x_0* +val + + +o +const +states_15_transpose_y_0 +*- +name% + +" +states_15_transpose_y_0* +val + + +� + transpose +x + +var_220! +perm + +value_states_3_perm_00 + transpose_157 +  + + +� +@*# +name + +" + transpose_157� +matmul +x + + +input_27 +y + + transpose_157* + transpose_x + +states_15_transpose_x_0* + transpose_y + +states_15_transpose_y_0, + states_15 +  + + +� +@* +name + + " + states_15o +const +var_230_perm_0 + + +*# +name + +" + op_230_perm_0*! +val + + + + + +j +const +var_232 + + +* +name + + +" +op_232** +val# + + + + + ����������� + transpose +x + + states_15 +perm + +var_230_perm_00 + transpose_154 +  + +� + +@*# +name + +" + transpose_154 +reshape +x + + transpose_154 +shape + +var_232& +input_29 +  + +� +�* +name + + " + +input_29� +linear +x + + +input_29B +weight8 +6 +4model_encoder_block_1_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& +input_31 +  + +� +�* +name + + " + +input_31� +add +x + +hidden_states_15 +y + + +input_31. +hidden_states_23 +  + +� +�*& +name + +" +hidden_states_23e +const +var_13_promoted_3 + *& +name + +" +op_13_promoted_3* +val +  + + + +@� +pow +x + +hidden_states_23 +y + +var_13_promoted_3% +var_242 +  + +� +�* +name + + +" +op_242g +const +var_243 + + +* +name + + +" +op_243*' +val  + + + + + +���������� + reduce_mean +x + +var_242 +axes + +var_243 + keep_dims + + +var_19' + +variance_7 +  + +� +* +name + +" + +variance_7Q +const +var_245 + * +name + + +" +op_245* +val +  + + + +�7�5p +add +x + + +variance_7 +y + +var_245$ +var_246 +  + +� +* +name + + +" +op_246e +const +var_247_epsilon_0 + *& +name + +" +op_247_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_246 +epsilon + +var_247_epsilon_0$ +var_247 +  + +� +* +name + + +" +op_247� +mul +x + +hidden_states_23 +y + +var_247. +hidden_states_27 +  + +� +�*& +name + +" +hidden_states_27� +mul8 +x3 +1 +/model_encoder_block_1_layer_1_layer_norm_weight +y + +hidden_states_27& +input_33 +  + +� +�* +name + + " + +input_33� +linear +x + + +input_33D +weight: +8 +6model_encoder_block_1_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0& +input_35 +  + +� +�* +name + + " + +input_35a +relu +x + + +input_35& +input_37 +  + +� +�* +name + + " + +input_37� +linear +x + + +input_37D +weight: +8 +6model_encoder_block_1_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0& +input_41 +  + +� +�* +name + + " + +input_41� +add +x + +hidden_states_23 +y + + +input_41. +hidden_states_29 +  + +� +�*& +name + +" +hidden_states_29e +const +var_13_promoted_4 + *& +name + +" +op_13_promoted_4* +val +  + + + +@� +pow +x + +hidden_states_29 +y + +var_13_promoted_4% +var_271 +  + +� +�* +name + + +" +op_271g +const +var_272 + + +* +name + + +" +op_272*' +val  + + + + + +���������� + reduce_mean +x + +var_271 +axes + +var_272 + keep_dims + + +var_19' + +variance_9 +  + +� +* +name + +" + +variance_9Q +const +var_274 + * +name + + +" +op_274* +val +  + + + +�7�5p +add +x + + +variance_9 +y + +var_274$ +var_275 +  + +� +* +name + + +" +op_275e +const +var_276_epsilon_0 + *& +name + +" +op_276_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_275 +epsilon + +var_276_epsilon_0$ +var_276 +  + +� +* +name + + +" +op_276� +mul +x + +hidden_states_29 +y + +var_276. +hidden_states_33 +  + +� +�*& +name + +" +hidden_states_33� +mul8 +x3 +1 +/model_encoder_block_2_layer_0_layer_norm_weight +y + +hidden_states_33. +hidden_states_35 +  + +� +�*& +name + +" +hidden_states_35� +linear +x + +hidden_states_35B +weight8 +6 +4model_encoder_block_2_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + states_17 +  + +� +�* +name + + " + states_17j +const +var_289 + + +* +name + + +" +op_289** +val# + + + + + ���������@} +reshape +x + + states_17 +shape + +var_289* +var_290 +  + +� + +@* +name + + +" +op_290� +linear +x + +hidden_states_35B +weight8 +6 +4model_encoder_block_2_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + states_19 +  + +� +�* +name + + " + states_19j +const +var_294 + + +* +name + + +" +op_294** +val# + + + + + ���������@} +reshape +x + + states_19 +shape + +var_294* +var_295 +  + +� + +@* +name + + +" +op_295� +linear +x + +hidden_states_35B +weight8 +6 +4model_encoder_block_2_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + states_21 +  + +� +�* +name + + " + states_21j +const +var_299 + + +* +name + + +" +op_299** +val# + + + + + ���������@} +reshape +x + + states_21 +shape + +var_299* +var_300 +  + +� + +@* +name + + +" +op_300~ +const% +value_states_5_perm_0 + + +*+ +name# + +" +value_states_5_perm_0*! +val + + + + + +m +const +scores_9_transpose_x_0 +*, +name$ + +" +scores_9_transpose_x_0* +val + + +m +const +scores_9_transpose_y_0 +*, +name$ + +" +scores_9_transpose_y_0* +val + + +z +const# +transpose_58_perm_0 + + +*) +name! + +" +transpose_58_perm_0*! +val + + + + + +z +const# +transpose_59_perm_0 + + +*) +name! + +" +transpose_59_perm_0*! +val + + + + + +� + transpose +x + +var_295 +perm + +transpose_59_perm_00 + transpose_151 +  + + +@ +�*# +name + +" + transpose_151� + transpose +x + +var_290 +perm + +transpose_58_perm_00 + transpose_152 +  + + +� +@*# +name + +" + transpose_152� +matmul +x + + transpose_152 +y + + transpose_151) + transpose_x + +scores_9_transpose_x_0) + transpose_y + +scores_9_transpose_y_0, +scores_9 +  + + +� +�* +name + + " + +scores_9� +add +x + + +scores_9 +y + +position_bias_3- + scores_11 +  + + +� +�* +name + + " + scores_11{ +softmax +x + + scores_11 +axis + +var_9+ +var_306 +  + + +� +�* +name + + +" +op_306j +identity +x + +var_306, +input_45 +  + + +� +�* +name + + " + +input_45o +const +states_23_transpose_x_0 +*- +name% + +" +states_23_transpose_x_0* +val + + +o +const +states_23_transpose_y_0 +*- +name% + +" +states_23_transpose_y_0* +val + + +� + transpose +x + +var_300! +perm + +value_states_5_perm_00 + transpose_153 +  + + +� +@*# +name + +" + transpose_153� +matmul +x + + +input_45 +y + + transpose_153* + transpose_x + +states_23_transpose_x_0* + transpose_y + +states_23_transpose_y_0, + states_23 +  + + +� +@* +name + + " + states_23o +const +var_310_perm_0 + + +*# +name + +" + op_310_perm_0*! +val + + + + + +j +const +var_312 + + +* +name + + +" +op_312** +val# + + + + + ����������� + transpose +x + + states_23 +perm + +var_310_perm_00 + transpose_150 +  + +� + +@*# +name + +" + transpose_150 +reshape +x + + transpose_150 +shape + +var_312& +input_47 +  + +� +�* +name + + " + +input_47� +linear +x + + +input_47B +weight8 +6 +4model_encoder_block_2_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& +input_49 +  + +� +�* +name + + " + +input_49� +add +x + +hidden_states_29 +y + + +input_49. +hidden_states_37 +  + +� +�*& +name + +" +hidden_states_37e +const +var_13_promoted_5 + *& +name + +" +op_13_promoted_5* +val +  + + + +@� +pow +x + +hidden_states_37 +y + +var_13_promoted_5% +var_322 +  + +� +�* +name + + +" +op_322g +const +var_323 + + +* +name + + +" +op_323*' +val  + + + + + +���������� + reduce_mean +x + +var_322 +axes + +var_323 + keep_dims + + +var_19( + variance_11 +  + +� +*! +name + +" + variance_11Q +const +var_325 + * +name + + +" +op_325* +val +  + + + +�7�5q +add +x + + variance_11 +y + +var_325$ +var_326 +  + +� +* +name + + +" +op_326e +const +var_327_epsilon_0 + *& +name + +" +op_327_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_326 +epsilon + +var_327_epsilon_0$ +var_327 +  + +� +* +name + + +" +op_327� +mul +x + +hidden_states_37 +y + +var_327. +hidden_states_41 +  + +� +�*& +name + +" +hidden_states_41� +mul8 +x3 +1 +/model_encoder_block_2_layer_1_layer_norm_weight +y + +hidden_states_41& +input_51 +  + +� +�* +name + + " + +input_51� +linear +x + + +input_51D +weight: +8 +6model_encoder_block_2_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0& +input_53 +  + +� +�* +name + + " + +input_53a +relu +x + + +input_53& +input_55 +  + +� +�* +name + + " + +input_55� +linear +x + + +input_55D +weight: +8 +6model_encoder_block_2_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0& +input_59 +  + +� +�* +name + + " + +input_59� +add +x + +hidden_states_37 +y + + +input_59. +hidden_states_43 +  + +� +�*& +name + +" +hidden_states_43e +const +var_13_promoted_6 + *& +name + +" +op_13_promoted_6* +val +  + + + +@� +pow +x + +hidden_states_43 +y + +var_13_promoted_6% +var_351 +  + +� +�* +name + + +" +op_351g +const +var_352 + + +* +name + + +" +op_352*' +val  + + + + + +���������� + reduce_mean +x + +var_351 +axes + +var_352 + keep_dims + + +var_19( + variance_13 +  + +� +*! +name + +" + variance_13Q +const +var_354 + * +name + + +" +op_354* +val +  + + + +�7�5q +add +x + + variance_13 +y + +var_354$ +var_355 +  + +� +* +name + + +" +op_355e +const +var_356_epsilon_0 + *& +name + +" +op_356_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_355 +epsilon + +var_356_epsilon_0$ +var_356 +  + +� +* +name + + +" +op_356� +mul +x + +hidden_states_43 +y + +var_356. +hidden_states_47 +  + +� +�*& +name + +" +hidden_states_47� +mul8 +x3 +1 +/model_encoder_block_3_layer_0_layer_norm_weight +y + +hidden_states_47. +hidden_states_49 +  + +� +�*& +name + +" +hidden_states_49� +linear +x + +hidden_states_49B +weight8 +6 +4model_encoder_block_3_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + states_25 +  + +� +�* +name + + " + states_25j +const +var_369 + + +* +name + + +" +op_369** +val# + + + + + ���������@} +reshape +x + + states_25 +shape + +var_369* +var_370 +  + +� + +@* +name + + +" +op_370� +linear +x + +hidden_states_49B +weight8 +6 +4model_encoder_block_3_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + states_27 +  + +� +�* +name + + " + states_27j +const +var_374 + + +* +name + + +" +op_374** +val# + + + + + ���������@} +reshape +x + + states_27 +shape + +var_374* +var_375 +  + +� + +@* +name + + +" +op_375� +linear +x + +hidden_states_49B +weight8 +6 +4model_encoder_block_3_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + states_29 +  + +� +�* +name + + " + states_29j +const +var_379 + + +* +name + + +" +op_379** +val# + + + + + ���������@} +reshape +x + + states_29 +shape + +var_379* +var_380 +  + +� + +@* +name + + +" +op_380~ +const% +value_states_7_perm_0 + + +*+ +name# + +" +value_states_7_perm_0*! +val + + + + + +o +const +scores_13_transpose_x_0 +*- +name% + +" +scores_13_transpose_x_0* +val + + +o +const +scores_13_transpose_y_0 +*- +name% + +" +scores_13_transpose_y_0* +val + + +z +const# +transpose_60_perm_0 + + +*) +name! + +" +transpose_60_perm_0*! +val + + + + + +z +const# +transpose_61_perm_0 + + +*) +name! + +" +transpose_61_perm_0*! +val + + + + + +� + transpose +x + +var_375 +perm + +transpose_61_perm_00 + transpose_147 +  + + +@ +�*# +name + +" + transpose_147� + transpose +x + +var_370 +perm + +transpose_60_perm_00 + transpose_148 +  + + +� +@*# +name + +" + transpose_148� +matmul +x + + transpose_148 +y + + transpose_147* + transpose_x + +scores_13_transpose_x_0* + transpose_y + +scores_13_transpose_y_0- + scores_13 +  + + +� +�* +name + + " + scores_13� +add +x + + scores_13 +y + +position_bias_3- + scores_15 +  + + +� +�* +name + + " + scores_15{ +softmax +x + + scores_15 +axis + +var_9+ +var_386 +  + + +� +�* +name + + +" +op_386j +identity +x + +var_386, +input_63 +  + + +� +�* +name + + " + +input_63o +const +states_31_transpose_x_0 +*- +name% + +" +states_31_transpose_x_0* +val + + +o +const +states_31_transpose_y_0 +*- +name% + +" +states_31_transpose_y_0* +val + + +� + transpose +x + +var_380! +perm + +value_states_7_perm_00 + transpose_149 +  + + +� +@*# +name + +" + transpose_149� +matmul +x + + +input_63 +y + + transpose_149* + transpose_x + +states_31_transpose_x_0* + transpose_y + +states_31_transpose_y_0, + states_31 +  + + +� +@* +name + + " + states_31o +const +var_390_perm_0 + + +*# +name + +" + op_390_perm_0*! +val + + + + + +j +const +var_392 + + +* +name + + +" +op_392** +val# + + + + + ����������� + transpose +x + + states_31 +perm + +var_390_perm_00 + transpose_146 +  + +� + +@*# +name + +" + transpose_146 +reshape +x + + transpose_146 +shape + +var_392& +input_65 +  + +� +�* +name + + " + +input_65� +linear +x + + +input_65B +weight8 +6 +4model_encoder_block_3_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& +input_67 +  + +� +�* +name + + " + +input_67� +add +x + +hidden_states_43 +y + + +input_67. +hidden_states_51 +  + +� +�*& +name + +" +hidden_states_51e +const +var_13_promoted_7 + *& +name + +" +op_13_promoted_7* +val +  + + + +@� +pow +x + +hidden_states_51 +y + +var_13_promoted_7% +var_402 +  + +� +�* +name + + +" +op_402g +const +var_403 + + +* +name + + +" +op_403*' +val  + + + + + +���������� + reduce_mean +x + +var_402 +axes + +var_403 + keep_dims + + +var_19( + variance_15 +  + +� +*! +name + +" + variance_15Q +const +var_405 + * +name + + +" +op_405* +val +  + + + +�7�5q +add +x + + variance_15 +y + +var_405$ +var_406 +  + +� +* +name + + +" +op_406e +const +var_407_epsilon_0 + *& +name + +" +op_407_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_406 +epsilon + +var_407_epsilon_0$ +var_407 +  + +� +* +name + + +" +op_407� +mul +x + +hidden_states_51 +y + +var_407. +hidden_states_55 +  + +� +�*& +name + +" +hidden_states_55� +mul8 +x3 +1 +/model_encoder_block_3_layer_1_layer_norm_weight +y + +hidden_states_55& +input_69 +  + +� +�* +name + + " + +input_69� +linear +x + + +input_69D +weight: +8 +6model_encoder_block_3_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0& +input_71 +  + +� +�* +name + + " + +input_71a +relu +x + + +input_71& +input_73 +  + +� +�* +name + + " + +input_73� +linear +x + + +input_73D +weight: +8 +6model_encoder_block_3_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0& +input_77 +  + +� +�* +name + + " + +input_77� +add +x + +hidden_states_51 +y + + +input_77. +hidden_states_57 +  + +� +�*& +name + +" +hidden_states_57e +const +var_13_promoted_8 + *& +name + +" +op_13_promoted_8* +val +  + + + +@� +pow +x + +hidden_states_57 +y + +var_13_promoted_8% +var_431 +  + +� +�* +name + + +" +op_431g +const +var_432 + + +* +name + + +" +op_432*' +val  + + + + + +���������� + reduce_mean +x + +var_431 +axes + +var_432 + keep_dims + + +var_19( + variance_17 +  + +� +*! +name + +" + variance_17Q +const +var_434 + * +name + + +" +op_434* +val +  + + + +�7�5q +add +x + + variance_17 +y + +var_434$ +var_435 +  + +� +* +name + + +" +op_435e +const +var_436_epsilon_0 + *& +name + +" +op_436_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_435 +epsilon + +var_436_epsilon_0$ +var_436 +  + +� +* +name + + +" +op_436� +mul +x + +hidden_states_57 +y + +var_436. +hidden_states_61 +  + +� +�*& +name + +" +hidden_states_61� +mul8 +x3 +1 +/model_encoder_block_4_layer_0_layer_norm_weight +y + +hidden_states_61. +hidden_states_63 +  + +� +�*& +name + +" +hidden_states_63� +linear +x + +hidden_states_63B +weight8 +6 +4model_encoder_block_4_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + states_33 +  + +� +�* +name + + " + states_33j +const +var_449 + + +* +name + + +" +op_449** +val# + + + + + ���������@} +reshape +x + + states_33 +shape + +var_449* +var_450 +  + +� + +@* +name + + +" +op_450� +linear +x + +hidden_states_63B +weight8 +6 +4model_encoder_block_4_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + states_35 +  + +� +�* +name + + " + states_35j +const +var_454 + + +* +name + + +" +op_454** +val# + + + + + ���������@} +reshape +x + + states_35 +shape + +var_454* +var_455 +  + +� + +@* +name + + +" +op_455� +linear +x + +hidden_states_63B +weight8 +6 +4model_encoder_block_4_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + states_37 +  + +� +�* +name + + " + states_37j +const +var_459 + + +* +name + + +" +op_459** +val# + + + + + ���������@} +reshape +x + + states_37 +shape + +var_459* +var_460 +  + +� + +@* +name + + +" +op_460~ +const% +value_states_9_perm_0 + + +*+ +name# + +" +value_states_9_perm_0*! +val + + + + + +o +const +scores_17_transpose_x_0 +*- +name% + +" +scores_17_transpose_x_0* +val + + +o +const +scores_17_transpose_y_0 +*- +name% + +" +scores_17_transpose_y_0* +val + + +z +const# +transpose_62_perm_0 + + +*) +name! + +" +transpose_62_perm_0*! +val + + + + + +z +const# +transpose_63_perm_0 + + +*) +name! + +" +transpose_63_perm_0*! +val + + + + + +� + transpose +x + +var_455 +perm + +transpose_63_perm_00 + transpose_143 +  + + +@ +�*# +name + +" + transpose_143� + transpose +x + +var_450 +perm + +transpose_62_perm_00 + transpose_144 +  + + +� +@*# +name + +" + transpose_144� +matmul +x + + transpose_144 +y + + transpose_143* + transpose_x + +scores_17_transpose_x_0* + transpose_y + +scores_17_transpose_y_0- + scores_17 +  + + +� +�* +name + + " + scores_17� +add +x + + scores_17 +y + +position_bias_3- + scores_19 +  + + +� +�* +name + + " + scores_19{ +softmax +x + + scores_19 +axis + +var_9+ +var_466 +  + + +� +�* +name + + +" +op_466j +identity +x + +var_466, +input_81 +  + + +� +�* +name + + " + +input_81o +const +states_39_transpose_x_0 +*- +name% + +" +states_39_transpose_x_0* +val + + +o +const +states_39_transpose_y_0 +*- +name% + +" +states_39_transpose_y_0* +val + + +� + transpose +x + +var_460! +perm + +value_states_9_perm_00 + transpose_145 +  + + +� +@*# +name + +" + transpose_145� +matmul +x + + +input_81 +y + + transpose_145* + transpose_x + +states_39_transpose_x_0* + transpose_y + +states_39_transpose_y_0, + states_39 +  + + +� +@* +name + + " + states_39o +const +var_470_perm_0 + + +*# +name + +" + op_470_perm_0*! +val + + + + + +j +const +var_472 + + +* +name + + +" +op_472** +val# + + + + + ����������� + transpose +x + + states_39 +perm + +var_470_perm_00 + transpose_142 +  + +� + +@*# +name + +" + transpose_142 +reshape +x + + transpose_142 +shape + +var_472& +input_83 +  + +� +�* +name + + " + +input_83� +linear +x + + +input_83B +weight8 +6 +4model_encoder_block_4_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& +input_85 +  + +� +�* +name + + " + +input_85� +add +x + +hidden_states_57 +y + + +input_85. +hidden_states_65 +  + +� +�*& +name + +" +hidden_states_65e +const +var_13_promoted_9 + *& +name + +" +op_13_promoted_9* +val +  + + + +@� +pow +x + +hidden_states_65 +y + +var_13_promoted_9% +var_482 +  + +� +�* +name + + +" +op_482g +const +var_483 + + +* +name + + +" +op_483*' +val  + + + + + +���������� + reduce_mean +x + +var_482 +axes + +var_483 + keep_dims + + +var_19( + variance_19 +  + +� +*! +name + +" + variance_19Q +const +var_485 + * +name + + +" +op_485* +val +  + + + +�7�5q +add +x + + variance_19 +y + +var_485$ +var_486 +  + +� +* +name + + +" +op_486e +const +var_487_epsilon_0 + *& +name + +" +op_487_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_486 +epsilon + +var_487_epsilon_0$ +var_487 +  + +� +* +name + + +" +op_487� +mul +x + +hidden_states_65 +y + +var_487. +hidden_states_69 +  + +� +�*& +name + +" +hidden_states_69� +mul8 +x3 +1 +/model_encoder_block_4_layer_1_layer_norm_weight +y + +hidden_states_69& +input_87 +  + +� +�* +name + + " + +input_87� +linear +x + + +input_87D +weight: +8 +6model_encoder_block_4_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0& +input_89 +  + +� +�* +name + + " + +input_89a +relu +x + + +input_89& +input_91 +  + +� +�* +name + + " + +input_91� +linear +x + + +input_91D +weight: +8 +6model_encoder_block_4_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0& +input_95 +  + +� +�* +name + + " + +input_95� +add +x + +hidden_states_65 +y + + +input_95. +hidden_states_71 +  + +� +�*& +name + +" +hidden_states_71g +const +var_13_promoted_10 + *' +name + +" +op_13_promoted_10* +val +  + + + +@� +pow +x + +hidden_states_71 +y + +var_13_promoted_10% +var_511 +  + +� +�* +name + + +" +op_511g +const +var_512 + + +* +name + + +" +op_512*' +val  + + + + + +���������� + reduce_mean +x + +var_511 +axes + +var_512 + keep_dims + + +var_19( + variance_21 +  + +� +*! +name + +" + variance_21Q +const +var_514 + * +name + + +" +op_514* +val +  + + + +�7�5q +add +x + + variance_21 +y + +var_514$ +var_515 +  + +� +* +name + + +" +op_515e +const +var_516_epsilon_0 + *& +name + +" +op_516_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_515 +epsilon + +var_516_epsilon_0$ +var_516 +  + +� +* +name + + +" +op_516� +mul +x + +hidden_states_71 +y + +var_516. +hidden_states_75 +  + +� +�*& +name + +" +hidden_states_75� +mul8 +x3 +1 +/model_encoder_block_5_layer_0_layer_norm_weight +y + +hidden_states_75. +hidden_states_77 +  + +� +�*& +name + +" +hidden_states_77� +linear +x + +hidden_states_77B +weight8 +6 +4model_encoder_block_5_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + states_41 +  + +� +�* +name + + " + states_41j +const +var_529 + + +* +name + + +" +op_529** +val# + + + + + ���������@} +reshape +x + + states_41 +shape + +var_529* +var_530 +  + +� + +@* +name + + +" +op_530� +linear +x + +hidden_states_77B +weight8 +6 +4model_encoder_block_5_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + states_43 +  + +� +�* +name + + " + states_43j +const +var_534 + + +* +name + + +" +op_534** +val# + + + + + ���������@} +reshape +x + + states_43 +shape + +var_534* +var_535 +  + +� + +@* +name + + +" +op_535� +linear +x + +hidden_states_77B +weight8 +6 +4model_encoder_block_5_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + states_45 +  + +� +�* +name + + " + states_45j +const +var_539 + + +* +name + + +" +op_539** +val# + + + + + ���������@} +reshape +x + + states_45 +shape + +var_539* +var_540 +  + +� + +@* +name + + +" +op_540� +const& +value_states_11_perm_0 + + +*, +name$ + +" +value_states_11_perm_0*! +val + + + + + +o +const +scores_21_transpose_x_0 +*- +name% + +" +scores_21_transpose_x_0* +val + + +o +const +scores_21_transpose_y_0 +*- +name% + +" +scores_21_transpose_y_0* +val + + +z +const# +transpose_64_perm_0 + + +*) +name! + +" +transpose_64_perm_0*! +val + + + + + +z +const# +transpose_65_perm_0 + + +*) +name! + +" +transpose_65_perm_0*! +val + + + + + +� + transpose +x + +var_535 +perm + +transpose_65_perm_00 + transpose_139 +  + + +@ +�*# +name + +" + transpose_139� + transpose +x + +var_530 +perm + +transpose_64_perm_00 + transpose_140 +  + + +� +@*# +name + +" + transpose_140� +matmul +x + + transpose_140 +y + + transpose_139* + transpose_x + +scores_21_transpose_x_0* + transpose_y + +scores_21_transpose_y_0- + scores_21 +  + + +� +�* +name + + " + scores_21� +add +x + + scores_21 +y + +position_bias_3- + scores_23 +  + + +� +�* +name + + " + scores_23{ +softmax +x + + scores_23 +axis + +var_9+ +var_546 +  + + +� +�* +name + + +" +op_546j +identity +x + +var_546, +input_99 +  + + +� +�* +name + + " + +input_99o +const +states_47_transpose_x_0 +*- +name% + +" +states_47_transpose_x_0* +val + + +o +const +states_47_transpose_y_0 +*- +name% + +" +states_47_transpose_y_0* +val + + +� + transpose +x + +var_540" +perm + +value_states_11_perm_00 + transpose_141 +  + + +� +@*# +name + +" + transpose_141� +matmul +x + + +input_99 +y + + transpose_141* + transpose_x + +states_47_transpose_x_0* + transpose_y + +states_47_transpose_y_0, + states_47 +  + + +� +@* +name + + " + states_47o +const +var_550_perm_0 + + +*# +name + +" + op_550_perm_0*! +val + + + + + +j +const +var_552 + + +* +name + + +" +op_552** +val# + + + + + ����������� + transpose +x + + states_47 +perm + +var_550_perm_00 + transpose_138 +  + +� + +@*# +name + +" + transpose_138� +reshape +x + + transpose_138 +shape + +var_552' + input_101 +  + +� +�* +name + + " + input_101� +linear +x + + input_101B +weight8 +6 +4model_encoder_block_5_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0' + input_103 +  + +� +�* +name + + " + input_103� +add +x + +hidden_states_71 +y + + input_103. +hidden_states_79 +  + +� +�*& +name + +" +hidden_states_79g +const +var_13_promoted_11 + *' +name + +" +op_13_promoted_11* +val +  + + + +@� +pow +x + +hidden_states_79 +y + +var_13_promoted_11% +var_562 +  + +� +�* +name + + +" +op_562g +const +var_563 + + +* +name + + +" +op_563*' +val  + + + + + +���������� + reduce_mean +x + +var_562 +axes + +var_563 + keep_dims + + +var_19( + variance_23 +  + +� +*! +name + +" + variance_23Q +const +var_565 + * +name + + +" +op_565* +val +  + + + +�7�5q +add +x + + variance_23 +y + +var_565$ +var_566 +  + +� +* +name + + +" +op_566e +const +var_567_epsilon_0 + *& +name + +" +op_567_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_566 +epsilon + +var_567_epsilon_0$ +var_567 +  + +� +* +name + + +" +op_567� +mul +x + +hidden_states_79 +y + +var_567. +hidden_states_83 +  + +� +�*& +name + +" +hidden_states_83� +mul8 +x3 +1 +/model_encoder_block_5_layer_1_layer_norm_weight +y + +hidden_states_83' + input_105 +  + +� +�* +name + + " + input_105� +linear +x + + input_105D +weight: +8 +6model_encoder_block_5_layer_1_DenseReluDense_wi_weight +bias + +input_17_bias_0' + input_107 +  + +� +�* +name + + " + input_107d +relu +x + + input_107' + input_109 +  + +� +�* +name + + " + input_109� +linear +x + + input_109D +weight: +8 +6model_encoder_block_5_layer_1_DenseReluDense_wo_weight +bias + +states_1_bias_0' + input_113 +  + +� +�* +name + + " + input_113� +add +x + +hidden_states_79 +y + + input_113. +hidden_states_85 +  + +� +�*& +name + +" +hidden_states_85g +const +var_13_promoted_12 + *' +name + +" +op_13_promoted_12* +val +  + + + +@� +pow +x + +hidden_states_85 +y + +var_13_promoted_12% +var_585 +  + +� +�* +name + + +" +op_585g +const +var_586 + + +* +name + + +" +op_586*' +val  + + + + + +���������� + reduce_mean +x + +var_585 +axes + +var_586 + keep_dims + + +var_19( + variance_25 +  + +� +*! +name + +" + variance_25Q +const +var_588 + * +name + + +" +op_588* +val +  + + + +�7�5q +add +x + + variance_25 +y + +var_588$ +var_589 +  + +� +* +name + + +" +op_589e +const +var_590_epsilon_0 + *& +name + +" +op_590_epsilon_0* +val +  + + + +̼�+ +rsqrt +x + +var_589 +epsilon + +var_590_epsilon_0$ +var_590 +  + +� +* +name + + +" +op_590� +mul +x + +hidden_states_85 +y + +var_590. +hidden_states_89 +  + +� +�*& +name + +" +hidden_states_89� +mul. +x) +' +%model_encoder_final_layer_norm_weight +y + +hidden_states_89' + input_115 +  + +� +�* +name + + " + input_115a +const +input_119_axis_0 +*& +name + +" +input_119_axis_0* +val + + +� +gather +x + +model_shared_weight +indices + +decoder_input_ids +axis + +input_119_axis_0& + input_119 +  + +{ +�* +name + + " + input_119�w +const) +var_624 + + + +{ +{* +name + + +" +op_624*�v +val�v + + + +{ +{�v +�v�v +�vl +const +var_628_axes_0 + + +*# +name + +" + op_628_axes_0* +val + + + + +� + expand_dims +x + +decoder_attention_mask +axes + +var_628_axes_0# +var_628 + + + +{* +name + + +" +op_628l +const +var_629_axes_0 + + +*# +name + +" + op_629_axes_0* +val + + + + +� + expand_dims +x + +var_628 +axes + +var_629_axes_0) +var_629 + + + + +{* +name + + +" +op_629� +mul +x + +var_624 +y + +var_6299 +extended_attention_mask + + + +{ +{*- +name% + +" +extended_attention_maska +const +var_632_dtype_0 +*$ +name + +" +op_632_dtype_0* +val + + +" +fp32� +cast +x + +extended_attention_mask +dtype + +var_632_dtype_0) +cast_86 +  + + +{ +{* +name + + " +cast_86q +sub +x + + +var_17 +y + +cast_86) +var_633 +  + + +{ +{* +name + + +" +op_633Q +const +var_634 + * +name + + +" +op_634* +val +  + + + +���q +mul +x + +var_633 +y + +var_634( +mask_3 +  + + +{ +{* +name + + +" +mask_3g +const +var_13_promoted_13 + *' +name + +" +op_13_promoted_13* +val +  + + + +@z +pow +x + + input_119 +y + +var_13_promoted_13$ +var_655 +  + +{ +�* +name + + +" +op_655g +const +var_656 + + +* +name + + +" +op_656*' +val  + + + + + +���������� + reduce_mean +x + +var_655 +axes + +var_656 + keep_dims + + +var_19' + variance_27 +  + +{ +*! +name + +" + variance_27Q +const +var_658 + * +name + + +" +op_658* +val +  + + + +�7�5p +add +x + + variance_27 +y + +var_658# +var_659 +  + +{ +* +name + + +" +op_659e +const +var_660_epsilon_0 + *& +name + +" +op_660_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_659 +epsilon + +var_660_epsilon_0# +var_660 +  + +{ +* +name + + +" +op_660� +mul +x + + input_119 +y + +var_660- +hidden_states_95 +  + +{ +�*& +name + +" +hidden_states_95� +mul8 +x3 +1 +/model_decoder_block_0_layer_0_layer_norm_weight +y + +hidden_states_95- +hidden_states_97 +  + +{ +�*& +name + +" +hidden_states_97� +linear +x + +hidden_states_97B +weight8 +6 +4model_decoder_block_0_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& + states_49 +  + +{ +�* +name + + " + states_49j +const +var_675 + + +* +name + + +" +op_675** +val# + + + + + ���������@| +reshape +x + + states_49 +shape + +var_675) +var_676 +  + +{ + +@* +name + + +" +op_676� +linear +x + +hidden_states_97B +weight8 +6 +4model_decoder_block_0_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0& + states_51 +  + +{ +�* +name + + " + states_51j +const +var_680 + + +* +name + + +" +op_680** +val# + + + + + ���������@| +reshape +x + + states_51 +shape + +var_680) +var_681 +  + +{ + +@* +name + + +" +op_681� +linear +x + +hidden_states_97B +weight8 +6 +4model_decoder_block_0_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0& + states_53 +  + +{ +�* +name + + " + states_53j +const +var_685 + + +* +name + + +" +op_685** +val# + + + + + ���������@| +reshape +x + + states_53 +shape + +var_685) +var_686 +  + +{ + +@* +name + + +" +op_686� +const& +value_states_13_perm_0 + + +*, +name$ + +" +value_states_13_perm_0*! +val + + + + + +o +const +scores_25_transpose_x_0 +*- +name% + +" +scores_25_transpose_x_0* +val + + +o +const +scores_25_transpose_y_0 +*- +name% + +" +scores_25_transpose_y_0* +val + + +z +const# +transpose_66_perm_0 + + +*) +name! + +" +transpose_66_perm_0*! +val + + + + + +z +const# +transpose_67_perm_0 + + +*) +name! + +" +transpose_67_perm_0*! +val + + + + + +� + transpose +x + +var_681 +perm + +transpose_67_perm_0/ + transpose_135 +  + + +@ +{*# +name + +" + transpose_135� + transpose +x + +var_676 +perm + +transpose_66_perm_0/ + transpose_136 +  + + +{ +@*# +name + +" + transpose_136� +matmul +x + + transpose_136 +y + + transpose_135* + transpose_x + +scores_25_transpose_x_0* + transpose_y + +scores_25_transpose_y_0+ + scores_25 +  + + +{ +{* +name + + " + scores_25� +const1 +position_bias_5 +  + + +{ +{*% +name + +" +position_bias_5*N +valG +  + + +{ +{*% +@model_path/weights/weight.bin���s� +add +x + +position_bias_5 +y + + +mask_31 +position_bias_7 +  + + +{ +{*% +name + +" +position_bias_7� +add +x + + scores_25 +y + +position_bias_7+ + scores_27 +  + + +{ +{* +name + + " + scores_27y +softmax +x + + scores_27 +axis + +var_9) +var_725 +  + + +{ +{* +name + + +" +op_725j +identity +x + +var_725+ + input_125 +  + + +{ +{* +name + + " + input_125o +const +states_55_transpose_x_0 +*- +name% + +" +states_55_transpose_x_0* +val + + +o +const +states_55_transpose_y_0 +*- +name% + +" +states_55_transpose_y_0* +val + + +� + transpose +x + +var_686" +perm + +value_states_13_perm_0/ + transpose_137 +  + + +{ +@*# +name + +" + transpose_137� +matmul +x + + input_125 +y + + transpose_137* + transpose_x + +states_55_transpose_x_0* + transpose_y + +states_55_transpose_y_0+ + states_55 +  + + +{ +@* +name + + " + states_55o +const +var_729_perm_0 + + +*# +name + +" + op_729_perm_0*! +val + + + + + +j +const +var_731 + + +* +name + + +" +op_731** +val# + + + + + ����������� + transpose +x + + states_55 +perm + +var_729_perm_0/ + transpose_134 +  + +{ + +@*# +name + +" + transpose_134� +reshape +x + + transpose_134 +shape + +var_731& + input_127 +  + +{ +�* +name + + " + input_127� +linear +x + + input_127B +weight8 +6 +4model_decoder_block_0_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_129 +  + +{ +�* +name + + " + input_129� +add +x + + input_119 +y + + input_129- +hidden_states_99 +  + +{ +�*& +name + +" +hidden_states_99g +const +var_13_promoted_14 + *' +name + +" +op_13_promoted_14* +val +  + + + +@� +pow +x + +hidden_states_99 +y + +var_13_promoted_14$ +var_747 +  + +{ +�* +name + + +" +op_747g +const +var_748 + + +* +name + + +" +op_748*' +val  + + + + + +���������� + reduce_mean +x + +var_747 +axes + +var_748 + keep_dims + + +var_19' + variance_29 +  + +{ +*! +name + +" + variance_29Q +const +var_750 + * +name + + +" +op_750* +val +  + + + +�7�5p +add +x + + variance_29 +y + +var_750# +var_751 +  + +{ +* +name + + +" +op_751e +const +var_752_epsilon_0 + *& +name + +" +op_752_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_751 +epsilon + +var_752_epsilon_0# +var_752 +  + +{ +* +name + + +" +op_752� +mul +x + +hidden_states_99 +y + +var_752. +hidden_states_103 +  + +{ +�*' +name + +" +hidden_states_103� +mul8 +x3 +1 +/model_decoder_block_0_layer_1_layer_norm_weight +y + +hidden_states_103. +hidden_states_105 +  + +{ +�*' +name + +" +hidden_states_105� +linear +x + +hidden_states_105D +weight: +8 +6model_decoder_block_0_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0& + states_57 +  + +{ +�* +name + + " + states_57j +const +var_767 + + +* +name + + +" +op_767** +val# + + + + + ���������@| +reshape +x + + states_57 +shape + +var_767) +var_768 +  + +{ + +@* +name + + +" +op_768� +linear +x + + input_115D +weight: +8 +6model_decoder_block_0_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0' + states_59 +  + +� +�* +name + + " + states_59j +const +var_772 + + +* +name + + +" +op_772** +val# + + + + + ���������@} +reshape +x + + states_59 +shape + +var_772* +var_773 +  + +� + +@* +name + + +" +op_773� +linear +x + + input_115D +weight: +8 +6model_decoder_block_0_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0' + states_61 +  + +� +�* +name + + " + states_61j +const +var_777 + + +* +name + + +" +op_777** +val# + + + + + ���������@} +reshape +x + + states_61 +shape + +var_777* +var_778 +  + +� + +@* +name + + +" +op_778� +const& +value_states_15_perm_0 + + +*, +name$ + +" +value_states_15_perm_0*! +val + + + + + +o +const +scores_29_transpose_x_0 +*- +name% + +" +scores_29_transpose_x_0* +val + + +o +const +scores_29_transpose_y_0 +*- +name% + +" +scores_29_transpose_y_0* +val + + +z +const# +transpose_68_perm_0 + + +*) +name! + +" +transpose_68_perm_0*! +val + + + + + +z +const# +transpose_69_perm_0 + + +*) +name! + +" +transpose_69_perm_0*! +val + + + + + +� + transpose +x + +var_773 +perm + +transpose_69_perm_00 + transpose_131 +  + + +@ +�*# +name + +" + transpose_131� + transpose +x + +var_768 +perm + +transpose_68_perm_0/ + transpose_132 +  + + +{ +@*# +name + +" + transpose_132� +matmul +x + + transpose_132 +y + + transpose_131* + transpose_x + +scores_29_transpose_x_0* + transpose_y + +scores_29_transpose_y_0, + scores_29 +  + + +{ +�* +name + + " + scores_29� +const2 +position_bias_9 +  + + +{ +�*% +name + +" +position_bias_9*O +valH +  + + +{ +�*% +@model_path/weights/weight.bin���s� +add +x + +position_bias_9 +y + + +mask_10 + position_bias +  + + +{ +�*# +name + +" + position_bias� +add +x + + scores_29 +y + + position_bias, + scores_31 +  + + +{ +�* +name + + " + scores_31z +softmax +x + + scores_31 +axis + +var_9* +var_787 +  + + +{ +�* +name + + +" +op_787k +identity +x + +var_787, + input_133 +  + + +{ +�* +name + + " + input_133o +const +states_63_transpose_x_0 +*- +name% + +" +states_63_transpose_x_0* +val + + +o +const +states_63_transpose_y_0 +*- +name% + +" +states_63_transpose_y_0* +val + + +� + transpose +x + +var_778" +perm + +value_states_15_perm_00 + transpose_133 +  + + +� +@*# +name + +" + transpose_133� +matmul +x + + input_133 +y + + transpose_133* + transpose_x + +states_63_transpose_x_0* + transpose_y + +states_63_transpose_y_0+ + states_63 +  + + +{ +@* +name + + " + states_63o +const +var_791_perm_0 + + +*# +name + +" + op_791_perm_0*! +val + + + + + +j +const +var_793 + + +* +name + + +" +op_793** +val# + + + + + ����������� + transpose +x + + states_63 +perm + +var_791_perm_0/ + transpose_130 +  + +{ + +@*# +name + +" + transpose_130� +reshape +x + + transpose_130 +shape + +var_793& + input_135 +  + +{ +�* +name + + " + input_135� +linear +x + + input_135D +weight: +8 +6model_decoder_block_0_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_137 +  + +{ +�* +name + + " + input_137� +add +x + +hidden_states_99 +y + + input_137. +hidden_states_107 +  + +{ +�*' +name + +" +hidden_states_107g +const +var_13_promoted_15 + *' +name + +" +op_13_promoted_15* +val +  + + + +@� +pow +x + +hidden_states_107 +y + +var_13_promoted_15$ +var_809 +  + +{ +�* +name + + +" +op_809g +const +var_810 + + +* +name + + +" +op_810*' +val  + + + + + +���������� + reduce_mean +x + +var_809 +axes + +var_810 + keep_dims + + +var_19' + variance_31 +  + +{ +*! +name + +" + variance_31Q +const +var_812 + * +name + + +" +op_812* +val +  + + + +�7�5p +add +x + + variance_31 +y + +var_812# +var_813 +  + +{ +* +name + + +" +op_813e +const +var_814_epsilon_0 + *& +name + +" +op_814_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_813 +epsilon + +var_814_epsilon_0# +var_814 +  + +{ +* +name + + +" +op_814� +mul +x + +hidden_states_107 +y + +var_814. +hidden_states_111 +  + +{ +�*' +name + +" +hidden_states_111� +mul8 +x3 +1 +/model_decoder_block_0_layer_2_layer_norm_weight +y + +hidden_states_111& + input_139 +  + +{ +�* +name + + " + input_139� +linear +x + + input_139D +weight: +8 +6model_decoder_block_0_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_141 +  + +{ +�* +name + + " + input_141c +relu +x + + input_141& + input_143 +  + +{ +�* +name + + " + input_143� +linear +x + + input_143D +weight: +8 +6model_decoder_block_0_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_147 +  + +{ +�* +name + + " + input_147� +add +x + +hidden_states_107 +y + + input_147. +hidden_states_113 +  + +{ +�*' +name + +" +hidden_states_113g +const +var_13_promoted_16 + *' +name + +" +op_13_promoted_16* +val +  + + + +@� +pow +x + +hidden_states_113 +y + +var_13_promoted_16$ +var_844 +  + +{ +�* +name + + +" +op_844g +const +var_845 + + +* +name + + +" +op_845*' +val  + + + + + +���������� + reduce_mean +x + +var_844 +axes + +var_845 + keep_dims + + +var_19' + variance_33 +  + +{ +*! +name + +" + variance_33Q +const +var_847 + * +name + + +" +op_847* +val +  + + + +�7�5p +add +x + + variance_33 +y + +var_847# +var_848 +  + +{ +* +name + + +" +op_848e +const +var_849_epsilon_0 + *& +name + +" +op_849_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_848 +epsilon + +var_849_epsilon_0# +var_849 +  + +{ +* +name + + +" +op_849� +mul +x + +hidden_states_113 +y + +var_849. +hidden_states_117 +  + +{ +�*' +name + +" +hidden_states_117� +mul8 +x3 +1 +/model_decoder_block_1_layer_0_layer_norm_weight +y + +hidden_states_117. +hidden_states_119 +  + +{ +�*' +name + +" +hidden_states_119� +linear +x + +hidden_states_119B +weight8 +6 +4model_decoder_block_1_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& + states_65 +  + +{ +�* +name + + " + states_65j +const +var_862 + + +* +name + + +" +op_862** +val# + + + + + ���������@| +reshape +x + + states_65 +shape + +var_862) +var_863 +  + +{ + +@* +name + + +" +op_863� +linear +x + +hidden_states_119B +weight8 +6 +4model_decoder_block_1_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0& + states_67 +  + +{ +�* +name + + " + states_67j +const +var_867 + + +* +name + + +" +op_867** +val# + + + + + ���������@| +reshape +x + + states_67 +shape + +var_867) +var_868 +  + +{ + +@* +name + + +" +op_868� +linear +x + +hidden_states_119B +weight8 +6 +4model_decoder_block_1_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0& + states_69 +  + +{ +�* +name + + " + states_69j +const +var_872 + + +* +name + + +" +op_872** +val# + + + + + ���������@| +reshape +x + + states_69 +shape + +var_872) +var_873 +  + +{ + +@* +name + + +" +op_873� +const& +value_states_17_perm_0 + + +*, +name$ + +" +value_states_17_perm_0*! +val + + + + + +o +const +scores_33_transpose_x_0 +*- +name% + +" +scores_33_transpose_x_0* +val + + +o +const +scores_33_transpose_y_0 +*- +name% + +" +scores_33_transpose_y_0* +val + + +z +const# +transpose_70_perm_0 + + +*) +name! + +" +transpose_70_perm_0*! +val + + + + + +z +const# +transpose_71_perm_0 + + +*) +name! + +" +transpose_71_perm_0*! +val + + + + + +� + transpose +x + +var_868 +perm + +transpose_71_perm_0/ + transpose_127 +  + + +@ +{*# +name + +" + transpose_127� + transpose +x + +var_863 +perm + +transpose_70_perm_0/ + transpose_128 +  + + +{ +@*# +name + +" + transpose_128� +matmul +x + + transpose_128 +y + + transpose_127* + transpose_x + +scores_33_transpose_x_0* + transpose_y + +scores_33_transpose_y_0+ + scores_33 +  + + +{ +{* +name + + " + scores_33� +add +x + + scores_33 +y + +position_bias_7+ + scores_35 +  + + +{ +{* +name + + " + scores_35y +softmax +x + + scores_35 +axis + +var_9) +var_879 +  + + +{ +{* +name + + +" +op_879j +identity +x + +var_879+ + input_151 +  + + +{ +{* +name + + " + input_151o +const +states_71_transpose_x_0 +*- +name% + +" +states_71_transpose_x_0* +val + + +o +const +states_71_transpose_y_0 +*- +name% + +" +states_71_transpose_y_0* +val + + +� + transpose +x + +var_873" +perm + +value_states_17_perm_0/ + transpose_129 +  + + +{ +@*# +name + +" + transpose_129� +matmul +x + + input_151 +y + + transpose_129* + transpose_x + +states_71_transpose_x_0* + transpose_y + +states_71_transpose_y_0+ + states_71 +  + + +{ +@* +name + + " + states_71o +const +var_883_perm_0 + + +*# +name + +" + op_883_perm_0*! +val + + + + + +j +const +var_885 + + +* +name + + +" +op_885** +val# + + + + + ����������� + transpose +x + + states_71 +perm + +var_883_perm_0/ + transpose_126 +  + +{ + +@*# +name + +" + transpose_126� +reshape +x + + transpose_126 +shape + +var_885& + input_153 +  + +{ +�* +name + + " + input_153� +linear +x + + input_153B +weight8 +6 +4model_decoder_block_1_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_155 +  + +{ +�* +name + + " + input_155� +add +x + +hidden_states_113 +y + + input_155. +hidden_states_121 +  + +{ +�*' +name + +" +hidden_states_121g +const +var_13_promoted_17 + *' +name + +" +op_13_promoted_17* +val +  + + + +@� +pow +x + +hidden_states_121 +y + +var_13_promoted_17$ +var_895 +  + +{ +�* +name + + +" +op_895g +const +var_896 + + +* +name + + +" +op_896*' +val  + + + + + +���������� + reduce_mean +x + +var_895 +axes + +var_896 + keep_dims + + +var_19' + variance_35 +  + +{ +*! +name + +" + variance_35Q +const +var_898 + * +name + + +" +op_898* +val +  + + + +�7�5p +add +x + + variance_35 +y + +var_898# +var_899 +  + +{ +* +name + + +" +op_899e +const +var_900_epsilon_0 + *& +name + +" +op_900_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_899 +epsilon + +var_900_epsilon_0# +var_900 +  + +{ +* +name + + +" +op_900� +mul +x + +hidden_states_121 +y + +var_900. +hidden_states_125 +  + +{ +�*' +name + +" +hidden_states_125� +mul8 +x3 +1 +/model_decoder_block_1_layer_1_layer_norm_weight +y + +hidden_states_125. +hidden_states_127 +  + +{ +�*' +name + +" +hidden_states_127� +linear +x + +hidden_states_127D +weight: +8 +6model_decoder_block_1_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0& + states_73 +  + +{ +�* +name + + " + states_73j +const +var_913 + + +* +name + + +" +op_913** +val# + + + + + ���������@| +reshape +x + + states_73 +shape + +var_913) +var_914 +  + +{ + +@* +name + + +" +op_914� +linear +x + + input_115D +weight: +8 +6model_decoder_block_1_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0' + states_75 +  + +� +�* +name + + " + states_75j +const +var_918 + + +* +name + + +" +op_918** +val# + + + + + ���������@} +reshape +x + + states_75 +shape + +var_918* +var_919 +  + +� + +@* +name + + +" +op_919� +linear +x + + input_115D +weight: +8 +6model_decoder_block_1_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0' + states_77 +  + +� +�* +name + + " + states_77j +const +var_923 + + +* +name + + +" +op_923** +val# + + + + + ���������@} +reshape +x + + states_77 +shape + +var_923* +var_924 +  + +� + +@* +name + + +" +op_924� +const& +value_states_19_perm_0 + + +*, +name$ + +" +value_states_19_perm_0*! +val + + + + + +o +const +scores_37_transpose_x_0 +*- +name% + +" +scores_37_transpose_x_0* +val + + +o +const +scores_37_transpose_y_0 +*- +name% + +" +scores_37_transpose_y_0* +val + + +z +const# +transpose_72_perm_0 + + +*) +name! + +" +transpose_72_perm_0*! +val + + + + + +z +const# +transpose_73_perm_0 + + +*) +name! + +" +transpose_73_perm_0*! +val + + + + + +� + transpose +x + +var_919 +perm + +transpose_73_perm_00 + transpose_123 +  + + +@ +�*# +name + +" + transpose_123� + transpose +x + +var_914 +perm + +transpose_72_perm_0/ + transpose_124 +  + + +{ +@*# +name + +" + transpose_124� +matmul +x + + transpose_124 +y + + transpose_123* + transpose_x + +scores_37_transpose_x_0* + transpose_y + +scores_37_transpose_y_0, + scores_37 +  + + +{ +�* +name + + " + scores_37� +add +x + + scores_37 +y + + position_bias, + scores_39 +  + + +{ +�* +name + + " + scores_39z +softmax +x + + scores_39 +axis + +var_9* +var_930 +  + + +{ +�* +name + + +" +op_930k +identity +x + +var_930, + input_159 +  + + +{ +�* +name + + " + input_159o +const +states_79_transpose_x_0 +*- +name% + +" +states_79_transpose_x_0* +val + + +o +const +states_79_transpose_y_0 +*- +name% + +" +states_79_transpose_y_0* +val + + +� + transpose +x + +var_924" +perm + +value_states_19_perm_00 + transpose_125 +  + + +� +@*# +name + +" + transpose_125� +matmul +x + + input_159 +y + + transpose_125* + transpose_x + +states_79_transpose_x_0* + transpose_y + +states_79_transpose_y_0+ + states_79 +  + + +{ +@* +name + + " + states_79o +const +var_934_perm_0 + + +*# +name + +" + op_934_perm_0*! +val + + + + + +j +const +var_936 + + +* +name + + +" +op_936** +val# + + + + + ����������� + transpose +x + + states_79 +perm + +var_934_perm_0/ + transpose_122 +  + +{ + +@*# +name + +" + transpose_122� +reshape +x + + transpose_122 +shape + +var_936& + input_161 +  + +{ +�* +name + + " + input_161� +linear +x + + input_161D +weight: +8 +6model_decoder_block_1_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_163 +  + +{ +�* +name + + " + input_163� +add +x + +hidden_states_121 +y + + input_163. +hidden_states_129 +  + +{ +�*' +name + +" +hidden_states_129g +const +var_13_promoted_18 + *' +name + +" +op_13_promoted_18* +val +  + + + +@� +pow +x + +hidden_states_129 +y + +var_13_promoted_18$ +var_946 +  + +{ +�* +name + + +" +op_946g +const +var_947 + + +* +name + + +" +op_947*' +val  + + + + + +���������� + reduce_mean +x + +var_946 +axes + +var_947 + keep_dims + + +var_19' + variance_37 +  + +{ +*! +name + +" + variance_37Q +const +var_949 + * +name + + +" +op_949* +val +  + + + +�7�5p +add +x + + variance_37 +y + +var_949# +var_950 +  + +{ +* +name + + +" +op_950e +const +var_951_epsilon_0 + *& +name + +" +op_951_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_950 +epsilon + +var_951_epsilon_0# +var_951 +  + +{ +* +name + + +" +op_951� +mul +x + +hidden_states_129 +y + +var_951. +hidden_states_133 +  + +{ +�*' +name + +" +hidden_states_133� +mul8 +x3 +1 +/model_decoder_block_1_layer_2_layer_norm_weight +y + +hidden_states_133& + input_165 +  + +{ +�* +name + + " + input_165� +linear +x + + input_165D +weight: +8 +6model_decoder_block_1_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_167 +  + +{ +�* +name + + " + input_167c +relu +x + + input_167& + input_169 +  + +{ +�* +name + + " + input_169� +linear +x + + input_169D +weight: +8 +6model_decoder_block_1_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_173 +  + +{ +�* +name + + " + input_173� +add +x + +hidden_states_129 +y + + input_173. +hidden_states_135 +  + +{ +�*' +name + +" +hidden_states_135g +const +var_13_promoted_19 + *' +name + +" +op_13_promoted_19* +val +  + + + +@� +pow +x + +hidden_states_135 +y + +var_13_promoted_19$ +var_977 +  + +{ +�* +name + + +" +op_977g +const +var_978 + + +* +name + + +" +op_978*' +val  + + + + + +���������� + reduce_mean +x + +var_977 +axes + +var_978 + keep_dims + + +var_19' + variance_39 +  + +{ +*! +name + +" + variance_39Q +const +var_980 + * +name + + +" +op_980* +val +  + + + +�7�5p +add +x + + variance_39 +y + +var_980# +var_981 +  + +{ +* +name + + +" +op_981e +const +var_982_epsilon_0 + *& +name + +" +op_982_epsilon_0* +val +  + + + +̼�+~ +rsqrt +x + +var_981 +epsilon + +var_982_epsilon_0# +var_982 +  + +{ +* +name + + +" +op_982� +mul +x + +hidden_states_135 +y + +var_982. +hidden_states_139 +  + +{ +�*' +name + +" +hidden_states_139� +mul8 +x3 +1 +/model_decoder_block_2_layer_0_layer_norm_weight +y + +hidden_states_139. +hidden_states_141 +  + +{ +�*' +name + +" +hidden_states_141� +linear +x + +hidden_states_141B +weight8 +6 +4model_decoder_block_2_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& + states_81 +  + +{ +�* +name + + " + states_81j +const +var_995 + + +* +name + + +" +op_995** +val# + + + + + ���������@| +reshape +x + + states_81 +shape + +var_995) +var_996 +  + +{ + +@* +name + + +" +op_996� +linear +x + +hidden_states_141B +weight8 +6 +4model_decoder_block_2_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0& + states_83 +  + +{ +�* +name + + " + states_83l +const +var_1000 + + +* +name + + " +op_1000** +val# + + + + + ���������@ +reshape +x + + states_83 +shape + + +var_1000* +var_1001 +  + +{ + +@* +name + + " +op_1001� +linear +x + +hidden_states_141B +weight8 +6 +4model_decoder_block_2_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0& + states_85 +  + +{ +�* +name + + " + states_85l +const +var_1005 + + +* +name + + " +op_1005** +val# + + + + + ���������@ +reshape +x + + states_85 +shape + + +var_1005* +var_1006 +  + +{ + +@* +name + + " +op_1006� +const& +value_states_21_perm_0 + + +*, +name$ + +" +value_states_21_perm_0*! +val + + + + + +o +const +scores_41_transpose_x_0 +*- +name% + +" +scores_41_transpose_x_0* +val + + +o +const +scores_41_transpose_y_0 +*- +name% + +" +scores_41_transpose_y_0* +val + + +z +const# +transpose_74_perm_0 + + +*) +name! + +" +transpose_74_perm_0*! +val + + + + + +z +const# +transpose_75_perm_0 + + +*) +name! + +" +transpose_75_perm_0*! +val + + + + + +� + transpose +x + + +var_1001 +perm + +transpose_75_perm_0/ + transpose_119 +  + + +@ +{*# +name + +" + transpose_119� + transpose +x + +var_996 +perm + +transpose_74_perm_0/ + transpose_120 +  + + +{ +@*# +name + +" + transpose_120� +matmul +x + + transpose_120 +y + + transpose_119* + transpose_x + +scores_41_transpose_x_0* + transpose_y + +scores_41_transpose_y_0+ + scores_41 +  + + +{ +{* +name + + " + scores_41� +add +x + + scores_41 +y + +position_bias_7+ + scores_43 +  + + +{ +{* +name + + " + scores_43{ +softmax +x + + scores_43 +axis + +var_9* +var_1012 +  + + +{ +{* +name + + " +op_1012k +identity +x + + +var_1012+ + input_177 +  + + +{ +{* +name + + " + input_177o +const +states_87_transpose_x_0 +*- +name% + +" +states_87_transpose_x_0* +val + + +o +const +states_87_transpose_y_0 +*- +name% + +" +states_87_transpose_y_0* +val + + +� + transpose +x + + +var_1006" +perm + +value_states_21_perm_0/ + transpose_121 +  + + +{ +@*# +name + +" + transpose_121� +matmul +x + + input_177 +y + + transpose_121* + transpose_x + +states_87_transpose_x_0* + transpose_y + +states_87_transpose_y_0+ + states_87 +  + + +{ +@* +name + + " + states_87q +const +var_1016_perm_0 + + +*$ +name + +" +op_1016_perm_0*! +val + + + + + +l +const +var_1018 + + +* +name + + " +op_1018** +val# + + + + + ����������� + transpose +x + + states_87 +perm + +var_1016_perm_0/ + transpose_118 +  + +{ + +@*# +name + +" + transpose_118� +reshape +x + + transpose_118 +shape + + +var_1018& + input_179 +  + +{ +�* +name + + " + input_179� +linear +x + + input_179B +weight8 +6 +4model_decoder_block_2_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_181 +  + +{ +�* +name + + " + input_181� +add +x + +hidden_states_135 +y + + input_181. +hidden_states_143 +  + +{ +�*' +name + +" +hidden_states_143g +const +var_13_promoted_20 + *' +name + +" +op_13_promoted_20* +val +  + + + +@� +pow +x + +hidden_states_143 +y + +var_13_promoted_20% +var_1028 +  + +{ +�* +name + + " +op_1028i +const +var_1029 + + +* +name + + " +op_1029*' +val  + + + + + +���������� + reduce_mean +x + + +var_1028 +axes + + +var_1029 + keep_dims + + +var_19' + variance_41 +  + +{ +*! +name + +" + variance_41S +const +var_1031 + * +name + + " +op_1031* +val +  + + + +�7�5s +add +x + + variance_41 +y + + +var_1031$ +var_1032 +  + +{ +* +name + + " +op_1032g +const +var_1033_epsilon_0 + *' +name + +" +op_1033_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1032! +epsilon + +var_1033_epsilon_0$ +var_1033 +  + +{ +* +name + + " +op_1033� +mul +x + +hidden_states_143 +y + + +var_1033. +hidden_states_147 +  + +{ +�*' +name + +" +hidden_states_147� +mul8 +x3 +1 +/model_decoder_block_2_layer_1_layer_norm_weight +y + +hidden_states_147. +hidden_states_149 +  + +{ +�*' +name + +" +hidden_states_149� +linear +x + +hidden_states_149D +weight: +8 +6model_decoder_block_2_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0& + states_89 +  + +{ +�* +name + + " + states_89l +const +var_1046 + + +* +name + + " +op_1046** +val# + + + + + ���������@ +reshape +x + + states_89 +shape + + +var_1046* +var_1047 +  + +{ + +@* +name + + " +op_1047� +linear +x + + input_115D +weight: +8 +6model_decoder_block_2_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0' + states_91 +  + +� +�* +name + + " + states_91l +const +var_1051 + + +* +name + + " +op_1051** +val# + + + + + ���������@� +reshape +x + + states_91 +shape + + +var_1051+ +var_1052 +  + +� + +@* +name + + " +op_1052� +linear +x + + input_115D +weight: +8 +6model_decoder_block_2_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0' + states_93 +  + +� +�* +name + + " + states_93l +const +var_1056 + + +* +name + + " +op_1056** +val# + + + + + ���������@� +reshape +x + + states_93 +shape + + +var_1056+ +var_1057 +  + +� + +@* +name + + " +op_1057� +const& +value_states_23_perm_0 + + +*, +name$ + +" +value_states_23_perm_0*! +val + + + + + +o +const +scores_45_transpose_x_0 +*- +name% + +" +scores_45_transpose_x_0* +val + + +o +const +scores_45_transpose_y_0 +*- +name% + +" +scores_45_transpose_y_0* +val + + +z +const# +transpose_76_perm_0 + + +*) +name! + +" +transpose_76_perm_0*! +val + + + + + +z +const# +transpose_77_perm_0 + + +*) +name! + +" +transpose_77_perm_0*! +val + + + + + +� + transpose +x + + +var_1052 +perm + +transpose_77_perm_00 + transpose_115 +  + + +@ +�*# +name + +" + transpose_115� + transpose +x + + +var_1047 +perm + +transpose_76_perm_0/ + transpose_116 +  + + +{ +@*# +name + +" + transpose_116� +matmul +x + + transpose_116 +y + + transpose_115* + transpose_x + +scores_45_transpose_x_0* + transpose_y + +scores_45_transpose_y_0, + scores_45 +  + + +{ +�* +name + + " + scores_45� +add +x + + scores_45 +y + + position_bias, + scores_47 +  + + +{ +�* +name + + " + scores_47| +softmax +x + + scores_47 +axis + +var_9+ +var_1063 +  + + +{ +�* +name + + " +op_1063l +identity +x + + +var_1063, + input_185 +  + + +{ +�* +name + + " + input_185o +const +states_95_transpose_x_0 +*- +name% + +" +states_95_transpose_x_0* +val + + +o +const +states_95_transpose_y_0 +*- +name% + +" +states_95_transpose_y_0* +val + + +� + transpose +x + + +var_1057" +perm + +value_states_23_perm_00 + transpose_117 +  + + +� +@*# +name + +" + transpose_117� +matmul +x + + input_185 +y + + transpose_117* + transpose_x + +states_95_transpose_x_0* + transpose_y + +states_95_transpose_y_0+ + states_95 +  + + +{ +@* +name + + " + states_95q +const +var_1067_perm_0 + + +*$ +name + +" +op_1067_perm_0*! +val + + + + + +l +const +var_1069 + + +* +name + + " +op_1069** +val# + + + + + ����������� + transpose +x + + states_95 +perm + +var_1067_perm_0/ + transpose_114 +  + +{ + +@*# +name + +" + transpose_114� +reshape +x + + transpose_114 +shape + + +var_1069& + input_187 +  + +{ +�* +name + + " + input_187� +linear +x + + input_187D +weight: +8 +6model_decoder_block_2_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_189 +  + +{ +�* +name + + " + input_189� +add +x + +hidden_states_143 +y + + input_189. +hidden_states_151 +  + +{ +�*' +name + +" +hidden_states_151g +const +var_13_promoted_21 + *' +name + +" +op_13_promoted_21* +val +  + + + +@� +pow +x + +hidden_states_151 +y + +var_13_promoted_21% +var_1079 +  + +{ +�* +name + + " +op_1079i +const +var_1080 + + +* +name + + " +op_1080*' +val  + + + + + +���������� + reduce_mean +x + + +var_1079 +axes + + +var_1080 + keep_dims + + +var_19' + variance_43 +  + +{ +*! +name + +" + variance_43S +const +var_1082 + * +name + + " +op_1082* +val +  + + + +�7�5s +add +x + + variance_43 +y + + +var_1082$ +var_1083 +  + +{ +* +name + + " +op_1083g +const +var_1084_epsilon_0 + *' +name + +" +op_1084_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1083! +epsilon + +var_1084_epsilon_0$ +var_1084 +  + +{ +* +name + + " +op_1084� +mul +x + +hidden_states_151 +y + + +var_1084. +hidden_states_155 +  + +{ +�*' +name + +" +hidden_states_155� +mul8 +x3 +1 +/model_decoder_block_2_layer_2_layer_norm_weight +y + +hidden_states_155& + input_191 +  + +{ +�* +name + + " + input_191� +linear +x + + input_191D +weight: +8 +6model_decoder_block_2_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_193 +  + +{ +�* +name + + " + input_193c +relu +x + + input_193& + input_195 +  + +{ +�* +name + + " + input_195� +linear +x + + input_195D +weight: +8 +6model_decoder_block_2_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_199 +  + +{ +�* +name + + " + input_199� +add +x + +hidden_states_151 +y + + input_199. +hidden_states_157 +  + +{ +�*' +name + +" +hidden_states_157g +const +var_13_promoted_22 + *' +name + +" +op_13_promoted_22* +val +  + + + +@� +pow +x + +hidden_states_157 +y + +var_13_promoted_22% +var_1110 +  + +{ +�* +name + + " +op_1110i +const +var_1111 + + +* +name + + " +op_1111*' +val  + + + + + +���������� + reduce_mean +x + + +var_1110 +axes + + +var_1111 + keep_dims + + +var_19' + variance_45 +  + +{ +*! +name + +" + variance_45S +const +var_1113 + * +name + + " +op_1113* +val +  + + + +�7�5s +add +x + + variance_45 +y + + +var_1113$ +var_1114 +  + +{ +* +name + + " +op_1114g +const +var_1115_epsilon_0 + *' +name + +" +op_1115_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1114! +epsilon + +var_1115_epsilon_0$ +var_1115 +  + +{ +* +name + + " +op_1115� +mul +x + +hidden_states_157 +y + + +var_1115. +hidden_states_161 +  + +{ +�*' +name + +" +hidden_states_161� +mul8 +x3 +1 +/model_decoder_block_3_layer_0_layer_norm_weight +y + +hidden_states_161. +hidden_states_163 +  + +{ +�*' +name + +" +hidden_states_163� +linear +x + +hidden_states_163B +weight8 +6 +4model_decoder_block_3_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0& + states_97 +  + +{ +�* +name + + " + states_97l +const +var_1128 + + +* +name + + " +op_1128** +val# + + + + + ���������@ +reshape +x + + states_97 +shape + + +var_1128* +var_1129 +  + +{ + +@* +name + + " +op_1129� +linear +x + +hidden_states_163B +weight8 +6 +4model_decoder_block_3_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0& + states_99 +  + +{ +�* +name + + " + states_99l +const +var_1133 + + +* +name + + " +op_1133** +val# + + + + + ���������@ +reshape +x + + states_99 +shape + + +var_1133* +var_1134 +  + +{ + +@* +name + + " +op_1134� +linear +x + +hidden_states_163B +weight8 +6 +4model_decoder_block_3_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + +states_101 +  + +{ +�* +name + +" + +states_101l +const +var_1138 + + +* +name + + " +op_1138** +val# + + + + + ���������@� +reshape +x + + +states_101 +shape + + +var_1138* +var_1139 +  + +{ + +@* +name + + " +op_1139� +const& +value_states_25_perm_0 + + +*, +name$ + +" +value_states_25_perm_0*! +val + + + + + +o +const +scores_49_transpose_x_0 +*- +name% + +" +scores_49_transpose_x_0* +val + + +o +const +scores_49_transpose_y_0 +*- +name% + +" +scores_49_transpose_y_0* +val + + +z +const# +transpose_78_perm_0 + + +*) +name! + +" +transpose_78_perm_0*! +val + + + + + +z +const# +transpose_79_perm_0 + + +*) +name! + +" +transpose_79_perm_0*! +val + + + + + +� + transpose +x + + +var_1134 +perm + +transpose_79_perm_0/ + transpose_111 +  + + +@ +{*# +name + +" + transpose_111� + transpose +x + + +var_1129 +perm + +transpose_78_perm_0/ + transpose_112 +  + + +{ +@*# +name + +" + transpose_112� +matmul +x + + transpose_112 +y + + transpose_111* + transpose_x + +scores_49_transpose_x_0* + transpose_y + +scores_49_transpose_y_0+ + scores_49 +  + + +{ +{* +name + + " + scores_49� +add +x + + scores_49 +y + +position_bias_7+ + scores_51 +  + + +{ +{* +name + + " + scores_51{ +softmax +x + + scores_51 +axis + +var_9* +var_1145 +  + + +{ +{* +name + + " +op_1145k +identity +x + + +var_1145+ + input_203 +  + + +{ +{* +name + + " + input_203q +const +states_103_transpose_x_0 +*. +name& + +" +states_103_transpose_x_0* +val + + +q +const +states_103_transpose_y_0 +*. +name& + +" +states_103_transpose_y_0* +val + + +� + transpose +x + + +var_1139" +perm + +value_states_25_perm_0/ + transpose_113 +  + + +{ +@*# +name + +" + transpose_113� +matmul +x + + input_203 +y + + transpose_113+ + transpose_x + +states_103_transpose_x_0+ + transpose_y + +states_103_transpose_y_0, + +states_103 +  + + +{ +@* +name + +" + +states_103q +const +var_1149_perm_0 + + +*$ +name + +" +op_1149_perm_0*! +val + + + + + +l +const +var_1151 + + +* +name + + " +op_1151** +val# + + + + + ����������� + transpose +x + + +states_103 +perm + +var_1149_perm_0/ + transpose_110 +  + +{ + +@*# +name + +" + transpose_110� +reshape +x + + transpose_110 +shape + + +var_1151& + input_205 +  + +{ +�* +name + + " + input_205� +linear +x + + input_205B +weight8 +6 +4model_decoder_block_3_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_207 +  + +{ +�* +name + + " + input_207� +add +x + +hidden_states_157 +y + + input_207. +hidden_states_165 +  + +{ +�*' +name + +" +hidden_states_165g +const +var_13_promoted_23 + *' +name + +" +op_13_promoted_23* +val +  + + + +@� +pow +x + +hidden_states_165 +y + +var_13_promoted_23% +var_1161 +  + +{ +�* +name + + " +op_1161i +const +var_1162 + + +* +name + + " +op_1162*' +val  + + + + + +���������� + reduce_mean +x + + +var_1161 +axes + + +var_1162 + keep_dims + + +var_19' + variance_47 +  + +{ +*! +name + +" + variance_47S +const +var_1164 + * +name + + " +op_1164* +val +  + + + +�7�5s +add +x + + variance_47 +y + + +var_1164$ +var_1165 +  + +{ +* +name + + " +op_1165g +const +var_1166_epsilon_0 + *' +name + +" +op_1166_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1165! +epsilon + +var_1166_epsilon_0$ +var_1166 +  + +{ +* +name + + " +op_1166� +mul +x + +hidden_states_165 +y + + +var_1166. +hidden_states_169 +  + +{ +�*' +name + +" +hidden_states_169� +mul8 +x3 +1 +/model_decoder_block_3_layer_1_layer_norm_weight +y + +hidden_states_169. +hidden_states_171 +  + +{ +�*' +name + +" +hidden_states_171� +linear +x + +hidden_states_171D +weight: +8 +6model_decoder_block_3_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0' + +states_105 +  + +{ +�* +name + +" + +states_105l +const +var_1179 + + +* +name + + " +op_1179** +val# + + + + + ���������@� +reshape +x + + +states_105 +shape + + +var_1179* +var_1180 +  + +{ + +@* +name + + " +op_1180� +linear +x + + input_115D +weight: +8 +6model_decoder_block_3_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0( + +states_107 +  + +� +�* +name + +" + +states_107l +const +var_1184 + + +* +name + + " +op_1184** +val# + + + + + ���������@� +reshape +x + + +states_107 +shape + + +var_1184+ +var_1185 +  + +� + +@* +name + + " +op_1185� +linear +x + + input_115D +weight: +8 +6model_decoder_block_3_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0( + +states_109 +  + +� +�* +name + +" + +states_109l +const +var_1189 + + +* +name + + " +op_1189** +val# + + + + + ���������@� +reshape +x + + +states_109 +shape + + +var_1189+ +var_1190 +  + +� + +@* +name + + " +op_1190� +const& +value_states_27_perm_0 + + +*, +name$ + +" +value_states_27_perm_0*! +val + + + + + +o +const +scores_53_transpose_x_0 +*- +name% + +" +scores_53_transpose_x_0* +val + + +o +const +scores_53_transpose_y_0 +*- +name% + +" +scores_53_transpose_y_0* +val + + +z +const# +transpose_80_perm_0 + + +*) +name! + +" +transpose_80_perm_0*! +val + + + + + +z +const# +transpose_81_perm_0 + + +*) +name! + +" +transpose_81_perm_0*! +val + + + + + +� + transpose +x + + +var_1185 +perm + +transpose_81_perm_00 + transpose_107 +  + + +@ +�*# +name + +" + transpose_107� + transpose +x + + +var_1180 +perm + +transpose_80_perm_0/ + transpose_108 +  + + +{ +@*# +name + +" + transpose_108� +matmul +x + + transpose_108 +y + + transpose_107* + transpose_x + +scores_53_transpose_x_0* + transpose_y + +scores_53_transpose_y_0, + scores_53 +  + + +{ +�* +name + + " + scores_53� +add +x + + scores_53 +y + + position_bias, + scores_55 +  + + +{ +�* +name + + " + scores_55| +softmax +x + + scores_55 +axis + +var_9+ +var_1196 +  + + +{ +�* +name + + " +op_1196l +identity +x + + +var_1196, + input_211 +  + + +{ +�* +name + + " + input_211q +const +states_111_transpose_x_0 +*. +name& + +" +states_111_transpose_x_0* +val + + +q +const +states_111_transpose_y_0 +*. +name& + +" +states_111_transpose_y_0* +val + + +� + transpose +x + + +var_1190" +perm + +value_states_27_perm_00 + transpose_109 +  + + +� +@*# +name + +" + transpose_109� +matmul +x + + input_211 +y + + transpose_109+ + transpose_x + +states_111_transpose_x_0+ + transpose_y + +states_111_transpose_y_0, + +states_111 +  + + +{ +@* +name + +" + +states_111q +const +var_1200_perm_0 + + +*$ +name + +" +op_1200_perm_0*! +val + + + + + +l +const +var_1202 + + +* +name + + " +op_1202** +val# + + + + + ����������� + transpose +x + + +states_111 +perm + +var_1200_perm_0/ + transpose_106 +  + +{ + +@*# +name + +" + transpose_106� +reshape +x + + transpose_106 +shape + + +var_1202& + input_213 +  + +{ +�* +name + + " + input_213� +linear +x + + input_213D +weight: +8 +6model_decoder_block_3_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_215 +  + +{ +�* +name + + " + input_215� +add +x + +hidden_states_165 +y + + input_215. +hidden_states_173 +  + +{ +�*' +name + +" +hidden_states_173g +const +var_13_promoted_24 + *' +name + +" +op_13_promoted_24* +val +  + + + +@� +pow +x + +hidden_states_173 +y + +var_13_promoted_24% +var_1212 +  + +{ +�* +name + + " +op_1212i +const +var_1213 + + +* +name + + " +op_1213*' +val  + + + + + +���������� + reduce_mean +x + + +var_1212 +axes + + +var_1213 + keep_dims + + +var_19' + variance_49 +  + +{ +*! +name + +" + variance_49S +const +var_1215 + * +name + + " +op_1215* +val +  + + + +�7�5s +add +x + + variance_49 +y + + +var_1215$ +var_1216 +  + +{ +* +name + + " +op_1216g +const +var_1217_epsilon_0 + *' +name + +" +op_1217_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1216! +epsilon + +var_1217_epsilon_0$ +var_1217 +  + +{ +* +name + + " +op_1217� +mul +x + +hidden_states_173 +y + + +var_1217. +hidden_states_177 +  + +{ +�*' +name + +" +hidden_states_177� +mul8 +x3 +1 +/model_decoder_block_3_layer_2_layer_norm_weight +y + +hidden_states_177& + input_217 +  + +{ +�* +name + + " + input_217� +linear +x + + input_217D +weight: +8 +6model_decoder_block_3_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_219 +  + +{ +�* +name + + " + input_219c +relu +x + + input_219& + input_221 +  + +{ +�* +name + + " + input_221� +linear +x + + input_221D +weight: +8 +6model_decoder_block_3_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_225 +  + +{ +�* +name + + " + input_225� +add +x + +hidden_states_173 +y + + input_225. +hidden_states_179 +  + +{ +�*' +name + +" +hidden_states_179g +const +var_13_promoted_25 + *' +name + +" +op_13_promoted_25* +val +  + + + +@� +pow +x + +hidden_states_179 +y + +var_13_promoted_25% +var_1243 +  + +{ +�* +name + + " +op_1243i +const +var_1244 + + +* +name + + " +op_1244*' +val  + + + + + +���������� + reduce_mean +x + + +var_1243 +axes + + +var_1244 + keep_dims + + +var_19' + variance_51 +  + +{ +*! +name + +" + variance_51S +const +var_1246 + * +name + + " +op_1246* +val +  + + + +�7�5s +add +x + + variance_51 +y + + +var_1246$ +var_1247 +  + +{ +* +name + + " +op_1247g +const +var_1248_epsilon_0 + *' +name + +" +op_1248_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1247! +epsilon + +var_1248_epsilon_0$ +var_1248 +  + +{ +* +name + + " +op_1248� +mul +x + +hidden_states_179 +y + + +var_1248. +hidden_states_183 +  + +{ +�*' +name + +" +hidden_states_183� +mul8 +x3 +1 +/model_decoder_block_4_layer_0_layer_norm_weight +y + +hidden_states_183. +hidden_states_185 +  + +{ +�*' +name + +" +hidden_states_185� +linear +x + +hidden_states_185B +weight8 +6 +4model_decoder_block_4_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + +states_113 +  + +{ +�* +name + +" + +states_113l +const +var_1261 + + +* +name + + " +op_1261** +val# + + + + + ���������@� +reshape +x + + +states_113 +shape + + +var_1261* +var_1262 +  + +{ + +@* +name + + " +op_1262� +linear +x + +hidden_states_185B +weight8 +6 +4model_decoder_block_4_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + +states_115 +  + +{ +�* +name + +" + +states_115l +const +var_1266 + + +* +name + + " +op_1266** +val# + + + + + ���������@� +reshape +x + + +states_115 +shape + + +var_1266* +var_1267 +  + +{ + +@* +name + + " +op_1267� +linear +x + +hidden_states_185B +weight8 +6 +4model_decoder_block_4_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + +states_117 +  + +{ +�* +name + +" + +states_117l +const +var_1271 + + +* +name + + " +op_1271** +val# + + + + + ���������@� +reshape +x + + +states_117 +shape + + +var_1271* +var_1272 +  + +{ + +@* +name + + " +op_1272� +const& +value_states_29_perm_0 + + +*, +name$ + +" +value_states_29_perm_0*! +val + + + + + +o +const +scores_57_transpose_x_0 +*- +name% + +" +scores_57_transpose_x_0* +val + + +o +const +scores_57_transpose_y_0 +*- +name% + +" +scores_57_transpose_y_0* +val + + +z +const# +transpose_82_perm_0 + + +*) +name! + +" +transpose_82_perm_0*! +val + + + + + +z +const# +transpose_83_perm_0 + + +*) +name! + +" +transpose_83_perm_0*! +val + + + + + +� + transpose +x + + +var_1267 +perm + +transpose_83_perm_0/ + transpose_103 +  + + +@ +{*# +name + +" + transpose_103� + transpose +x + + +var_1262 +perm + +transpose_82_perm_0/ + transpose_104 +  + + +{ +@*# +name + +" + transpose_104� +matmul +x + + transpose_104 +y + + transpose_103* + transpose_x + +scores_57_transpose_x_0* + transpose_y + +scores_57_transpose_y_0+ + scores_57 +  + + +{ +{* +name + + " + scores_57� +add +x + + scores_57 +y + +position_bias_7+ + scores_59 +  + + +{ +{* +name + + " + scores_59{ +softmax +x + + scores_59 +axis + +var_9* +var_1278 +  + + +{ +{* +name + + " +op_1278k +identity +x + + +var_1278+ + input_229 +  + + +{ +{* +name + + " + input_229q +const +states_119_transpose_x_0 +*. +name& + +" +states_119_transpose_x_0* +val + + +q +const +states_119_transpose_y_0 +*. +name& + +" +states_119_transpose_y_0* +val + + +� + transpose +x + + +var_1272" +perm + +value_states_29_perm_0/ + transpose_105 +  + + +{ +@*# +name + +" + transpose_105� +matmul +x + + input_229 +y + + transpose_105+ + transpose_x + +states_119_transpose_x_0+ + transpose_y + +states_119_transpose_y_0, + +states_119 +  + + +{ +@* +name + +" + +states_119q +const +var_1282_perm_0 + + +*$ +name + +" +op_1282_perm_0*! +val + + + + + +l +const +var_1284 + + +* +name + + " +op_1284** +val# + + + + + ����������� + transpose +x + + +states_119 +perm + +var_1282_perm_0/ + transpose_102 +  + +{ + +@*# +name + +" + transpose_102� +reshape +x + + transpose_102 +shape + + +var_1284& + input_231 +  + +{ +�* +name + + " + input_231� +linear +x + + input_231B +weight8 +6 +4model_decoder_block_4_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_233 +  + +{ +�* +name + + " + input_233� +add +x + +hidden_states_179 +y + + input_233. +hidden_states_187 +  + +{ +�*' +name + +" +hidden_states_187g +const +var_13_promoted_26 + *' +name + +" +op_13_promoted_26* +val +  + + + +@� +pow +x + +hidden_states_187 +y + +var_13_promoted_26% +var_1294 +  + +{ +�* +name + + " +op_1294i +const +var_1295 + + +* +name + + " +op_1295*' +val  + + + + + +���������� + reduce_mean +x + + +var_1294 +axes + + +var_1295 + keep_dims + + +var_19' + variance_53 +  + +{ +*! +name + +" + variance_53S +const +var_1297 + * +name + + " +op_1297* +val +  + + + +�7�5s +add +x + + variance_53 +y + + +var_1297$ +var_1298 +  + +{ +* +name + + " +op_1298g +const +var_1299_epsilon_0 + *' +name + +" +op_1299_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1298! +epsilon + +var_1299_epsilon_0$ +var_1299 +  + +{ +* +name + + " +op_1299� +mul +x + +hidden_states_187 +y + + +var_1299. +hidden_states_191 +  + +{ +�*' +name + +" +hidden_states_191� +mul8 +x3 +1 +/model_decoder_block_4_layer_1_layer_norm_weight +y + +hidden_states_191. +hidden_states_193 +  + +{ +�*' +name + +" +hidden_states_193� +linear +x + +hidden_states_193D +weight: +8 +6model_decoder_block_4_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0' + +states_121 +  + +{ +�* +name + +" + +states_121l +const +var_1312 + + +* +name + + " +op_1312** +val# + + + + + ���������@� +reshape +x + + +states_121 +shape + + +var_1312* +var_1313 +  + +{ + +@* +name + + " +op_1313� +linear +x + + input_115D +weight: +8 +6model_decoder_block_4_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0( + +states_123 +  + +� +�* +name + +" + +states_123l +const +var_1317 + + +* +name + + " +op_1317** +val# + + + + + ���������@� +reshape +x + + +states_123 +shape + + +var_1317+ +var_1318 +  + +� + +@* +name + + " +op_1318� +linear +x + + input_115D +weight: +8 +6model_decoder_block_4_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0( + +states_125 +  + +� +�* +name + +" + +states_125l +const +var_1322 + + +* +name + + " +op_1322** +val# + + + + + ���������@� +reshape +x + + +states_125 +shape + + +var_1322+ +var_1323 +  + +� + +@* +name + + " +op_1323� +const& +value_states_31_perm_0 + + +*, +name$ + +" +value_states_31_perm_0*! +val + + + + + +o +const +scores_61_transpose_x_0 +*- +name% + +" +scores_61_transpose_x_0* +val + + +o +const +scores_61_transpose_y_0 +*- +name% + +" +scores_61_transpose_y_0* +val + + +z +const# +transpose_84_perm_0 + + +*) +name! + +" +transpose_84_perm_0*! +val + + + + + +z +const# +transpose_85_perm_0 + + +*) +name! + +" +transpose_85_perm_0*! +val + + + + + +� + transpose +x + + +var_1318 +perm + +transpose_85_perm_0/ + transpose_99 +  + + +@ +�*" +name + +" + transpose_99� + transpose +x + + +var_1313 +perm + +transpose_84_perm_0/ + transpose_100 +  + + +{ +@*# +name + +" + transpose_100� +matmul +x + + transpose_100 +y + + transpose_99* + transpose_x + +scores_61_transpose_x_0* + transpose_y + +scores_61_transpose_y_0, + scores_61 +  + + +{ +�* +name + + " + scores_61� +add +x + + scores_61 +y + + position_bias, + scores_63 +  + + +{ +�* +name + + " + scores_63| +softmax +x + + scores_63 +axis + +var_9+ +var_1329 +  + + +{ +�* +name + + " +op_1329l +identity +x + + +var_1329, + input_237 +  + + +{ +�* +name + + " + input_237q +const +states_127_transpose_x_0 +*. +name& + +" +states_127_transpose_x_0* +val + + +q +const +states_127_transpose_y_0 +*. +name& + +" +states_127_transpose_y_0* +val + + +� + transpose +x + + +var_1323" +perm + +value_states_31_perm_00 + transpose_101 +  + + +� +@*# +name + +" + transpose_101� +matmul +x + + input_237 +y + + transpose_101+ + transpose_x + +states_127_transpose_x_0+ + transpose_y + +states_127_transpose_y_0, + +states_127 +  + + +{ +@* +name + +" + +states_127q +const +var_1333_perm_0 + + +*$ +name + +" +op_1333_perm_0*! +val + + + + + +l +const +var_1335 + + +* +name + + " +op_1335** +val# + + + + + ����������� + transpose +x + + +states_127 +perm + +var_1333_perm_0. + transpose_98 +  + +{ + +@*" +name + +" + transpose_98� +reshape +x + + transpose_98 +shape + + +var_1335& + input_239 +  + +{ +�* +name + + " + input_239� +linear +x + + input_239D +weight: +8 +6model_decoder_block_4_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_241 +  + +{ +�* +name + + " + input_241� +add +x + +hidden_states_187 +y + + input_241. +hidden_states_195 +  + +{ +�*' +name + +" +hidden_states_195g +const +var_13_promoted_27 + *' +name + +" +op_13_promoted_27* +val +  + + + +@� +pow +x + +hidden_states_195 +y + +var_13_promoted_27% +var_1345 +  + +{ +�* +name + + " +op_1345i +const +var_1346 + + +* +name + + " +op_1346*' +val  + + + + + +���������� + reduce_mean +x + + +var_1345 +axes + + +var_1346 + keep_dims + + +var_19' + variance_55 +  + +{ +*! +name + +" + variance_55S +const +var_1348 + * +name + + " +op_1348* +val +  + + + +�7�5s +add +x + + variance_55 +y + + +var_1348$ +var_1349 +  + +{ +* +name + + " +op_1349g +const +var_1350_epsilon_0 + *' +name + +" +op_1350_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1349! +epsilon + +var_1350_epsilon_0$ +var_1350 +  + +{ +* +name + + " +op_1350� +mul +x + +hidden_states_195 +y + + +var_1350. +hidden_states_199 +  + +{ +�*' +name + +" +hidden_states_199� +mul8 +x3 +1 +/model_decoder_block_4_layer_2_layer_norm_weight +y + +hidden_states_199& + input_243 +  + +{ +�* +name + + " + input_243� +linear +x + + input_243D +weight: +8 +6model_decoder_block_4_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_245 +  + +{ +�* +name + + " + input_245c +relu +x + + input_245& + input_247 +  + +{ +�* +name + + " + input_247� +linear +x + + input_247D +weight: +8 +6model_decoder_block_4_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_251 +  + +{ +�* +name + + " + input_251� +add +x + +hidden_states_195 +y + + input_251. +hidden_states_201 +  + +{ +�*' +name + +" +hidden_states_201g +const +var_13_promoted_28 + *' +name + +" +op_13_promoted_28* +val +  + + + +@� +pow +x + +hidden_states_201 +y + +var_13_promoted_28% +var_1376 +  + +{ +�* +name + + " +op_1376i +const +var_1377 + + +* +name + + " +op_1377*' +val  + + + + + +���������� + reduce_mean +x + + +var_1376 +axes + + +var_1377 + keep_dims + + +var_19' + variance_57 +  + +{ +*! +name + +" + variance_57S +const +var_1379 + * +name + + " +op_1379* +val +  + + + +�7�5s +add +x + + variance_57 +y + + +var_1379$ +var_1380 +  + +{ +* +name + + " +op_1380g +const +var_1381_epsilon_0 + *' +name + +" +op_1381_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1380! +epsilon + +var_1381_epsilon_0$ +var_1381 +  + +{ +* +name + + " +op_1381� +mul +x + +hidden_states_201 +y + + +var_1381. +hidden_states_205 +  + +{ +�*' +name + +" +hidden_states_205� +mul8 +x3 +1 +/model_decoder_block_5_layer_0_layer_norm_weight +y + +hidden_states_205. +hidden_states_207 +  + +{ +�*' +name + +" +hidden_states_207� +linear +x + +hidden_states_207B +weight8 +6 +4model_decoder_block_5_layer_0_SelfAttention_q_weight +bias + +states_1_bias_0' + +states_129 +  + +{ +�* +name + +" + +states_129l +const +var_1394 + + +* +name + + " +op_1394** +val# + + + + + ���������@� +reshape +x + + +states_129 +shape + + +var_1394* +var_1395 +  + +{ + +@* +name + + " +op_1395� +linear +x + +hidden_states_207B +weight8 +6 +4model_decoder_block_5_layer_0_SelfAttention_k_weight +bias + +states_1_bias_0' + +states_131 +  + +{ +�* +name + +" + +states_131l +const +var_1399 + + +* +name + + " +op_1399** +val# + + + + + ���������@� +reshape +x + + +states_131 +shape + + +var_1399* +var_1400 +  + +{ + +@* +name + + " +op_1400� +linear +x + +hidden_states_207B +weight8 +6 +4model_decoder_block_5_layer_0_SelfAttention_v_weight +bias + +states_1_bias_0' + +states_133 +  + +{ +�* +name + +" + +states_133l +const +var_1404 + + +* +name + + " +op_1404** +val# + + + + + ���������@� +reshape +x + + +states_133 +shape + + +var_1404* +var_1405 +  + +{ + +@* +name + + " +op_1405� +const& +value_states_33_perm_0 + + +*, +name$ + +" +value_states_33_perm_0*! +val + + + + + +o +const +scores_65_transpose_x_0 +*- +name% + +" +scores_65_transpose_x_0* +val + + +o +const +scores_65_transpose_y_0 +*- +name% + +" +scores_65_transpose_y_0* +val + + +z +const# +transpose_86_perm_0 + + +*) +name! + +" +transpose_86_perm_0*! +val + + + + + +z +const# +transpose_87_perm_0 + + +*) +name! + +" +transpose_87_perm_0*! +val + + + + + +� + transpose +x + + +var_1400 +perm + +transpose_87_perm_0. + transpose_95 +  + + +@ +{*" +name + +" + transpose_95� + transpose +x + + +var_1395 +perm + +transpose_86_perm_0. + transpose_96 +  + + +{ +@*" +name + +" + transpose_96� +matmul +x + + transpose_96 +y + + transpose_95* + transpose_x + +scores_65_transpose_x_0* + transpose_y + +scores_65_transpose_y_0+ + scores_65 +  + + +{ +{* +name + + " + scores_65� +add +x + + scores_65 +y + +position_bias_7+ + scores_67 +  + + +{ +{* +name + + " + scores_67{ +softmax +x + + scores_67 +axis + +var_9* +var_1411 +  + + +{ +{* +name + + " +op_1411k +identity +x + + +var_1411+ + input_255 +  + + +{ +{* +name + + " + input_255q +const +states_135_transpose_x_0 +*. +name& + +" +states_135_transpose_x_0* +val + + +q +const +states_135_transpose_y_0 +*. +name& + +" +states_135_transpose_y_0* +val + + +� + transpose +x + + +var_1405" +perm + +value_states_33_perm_0. + transpose_97 +  + + +{ +@*" +name + +" + transpose_97� +matmul +x + + input_255 +y + + transpose_97+ + transpose_x + +states_135_transpose_x_0+ + transpose_y + +states_135_transpose_y_0, + +states_135 +  + + +{ +@* +name + +" + +states_135q +const +var_1415_perm_0 + + +*$ +name + +" +op_1415_perm_0*! +val + + + + + +l +const +var_1417 + + +* +name + + " +op_1417** +val# + + + + + ����������� + transpose +x + + +states_135 +perm + +var_1415_perm_0. + transpose_94 +  + +{ + +@*" +name + +" + transpose_94� +reshape +x + + transpose_94 +shape + + +var_1417& + input_257 +  + +{ +�* +name + + " + input_257� +linear +x + + input_257B +weight8 +6 +4model_decoder_block_5_layer_0_SelfAttention_o_weight +bias + +states_1_bias_0& + input_259 +  + +{ +�* +name + + " + input_259� +add +x + +hidden_states_201 +y + + input_259. +hidden_states_209 +  + +{ +�*' +name + +" +hidden_states_209g +const +var_13_promoted_29 + *' +name + +" +op_13_promoted_29* +val +  + + + +@� +pow +x + +hidden_states_209 +y + +var_13_promoted_29% +var_1427 +  + +{ +�* +name + + " +op_1427i +const +var_1428 + + +* +name + + " +op_1428*' +val  + + + + + +���������� + reduce_mean +x + + +var_1427 +axes + + +var_1428 + keep_dims + + +var_19' + variance_59 +  + +{ +*! +name + +" + variance_59S +const +var_1430 + * +name + + " +op_1430* +val +  + + + +�7�5s +add +x + + variance_59 +y + + +var_1430$ +var_1431 +  + +{ +* +name + + " +op_1431g +const +var_1432_epsilon_0 + *' +name + +" +op_1432_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1431! +epsilon + +var_1432_epsilon_0$ +var_1432 +  + +{ +* +name + + " +op_1432� +mul +x + +hidden_states_209 +y + + +var_1432. +hidden_states_213 +  + +{ +�*' +name + +" +hidden_states_213� +mul8 +x3 +1 +/model_decoder_block_5_layer_1_layer_norm_weight +y + +hidden_states_213. +hidden_states_215 +  + +{ +�*' +name + +" +hidden_states_215� +linear +x + +hidden_states_215D +weight: +8 +6model_decoder_block_5_layer_1_EncDecAttention_q_weight +bias + +states_1_bias_0' + +states_137 +  + +{ +�* +name + +" + +states_137l +const +var_1445 + + +* +name + + " +op_1445** +val# + + + + + ���������@� +reshape +x + + +states_137 +shape + + +var_1445* +var_1446 +  + +{ + +@* +name + + " +op_1446� +linear +x + + input_115D +weight: +8 +6model_decoder_block_5_layer_1_EncDecAttention_k_weight +bias + +states_1_bias_0( + +states_139 +  + +� +�* +name + +" + +states_139l +const +var_1450 + + +* +name + + " +op_1450** +val# + + + + + ���������@� +reshape +x + + +states_139 +shape + + +var_1450+ +var_1451 +  + +� + +@* +name + + " +op_1451� +linear +x + + input_115D +weight: +8 +6model_decoder_block_5_layer_1_EncDecAttention_v_weight +bias + +states_1_bias_0( + +states_141 +  + +� +�* +name + +" + +states_141l +const +var_1455 + + +* +name + + " +op_1455** +val# + + + + + ���������@� +reshape +x + + +states_141 +shape + + +var_1455+ +var_1456 +  + +� + +@* +name + + " +op_1456z +const# +value_states_perm_0 + + +*) +name! + +" +value_states_perm_0*! +val + + + + + +o +const +scores_69_transpose_x_0 +*- +name% + +" +scores_69_transpose_x_0* +val + + +o +const +scores_69_transpose_y_0 +*- +name% + +" +scores_69_transpose_y_0* +val + + +z +const# +transpose_88_perm_0 + + +*) +name! + +" +transpose_88_perm_0*! +val + + + + + +z +const# +transpose_89_perm_0 + + +*) +name! + +" +transpose_89_perm_0*! +val + + + + + +� + transpose +x + + +var_1451 +perm + +transpose_89_perm_0/ + transpose_91 +  + + +@ +�*" +name + +" + transpose_91� + transpose +x + + +var_1446 +perm + +transpose_88_perm_0. + transpose_92 +  + + +{ +@*" +name + +" + transpose_92� +matmul +x + + transpose_92 +y + + transpose_91* + transpose_x + +scores_69_transpose_x_0* + transpose_y + +scores_69_transpose_y_0, + scores_69 +  + + +{ +�* +name + + " + scores_69z +add +x + + scores_69 +y + + position_bias) +scores +  + + +{ +�* +name + + +" +scoresy +softmax +x + + +scores +axis + +var_9+ +var_1462 +  + + +{ +�* +name + + " +op_1462l +identity +x + + +var_1462, + input_263 +  + + +{ +�* +name + + " + input_263i +const +states_transpose_x_0 +** +name" + +" +states_transpose_x_0* +val + + +i +const +states_transpose_y_0 +** +name" + +" +states_transpose_y_0* +val + + +� + transpose +x + + +var_1456 +perm + +value_states_perm_0/ + transpose_93 +  + + +� +@*" +name + +" + transpose_93� +matmul +x + + input_263 +y + + transpose_93' + transpose_x + +states_transpose_x_0' + transpose_y + +states_transpose_y_0( +states +  + + +{ +@* +name + + +" +statesq +const +var_1466_perm_0 + + +*$ +name + +" +op_1466_perm_0*! +val + + + + + +l +const +var_1468 + + +* +name + + " +op_1468** +val# + + + + + ����������� + transpose +x + + +states +perm + +var_1466_perm_0. + transpose_90 +  + +{ + +@*" +name + +" + transpose_90� +reshape +x + + transpose_90 +shape + + +var_1468& + input_265 +  + +{ +�* +name + + " + input_265� +linear +x + + input_265D +weight: +8 +6model_decoder_block_5_layer_1_EncDecAttention_o_weight +bias + +states_1_bias_0& + input_267 +  + +{ +�* +name + + " + input_267� +add +x + +hidden_states_209 +y + + input_267. +hidden_states_217 +  + +{ +�*' +name + +" +hidden_states_217g +const +var_13_promoted_30 + *' +name + +" +op_13_promoted_30* +val +  + + + +@� +pow +x + +hidden_states_217 +y + +var_13_promoted_30% +var_1478 +  + +{ +�* +name + + " +op_1478i +const +var_1479 + + +* +name + + " +op_1479*' +val  + + + + + +���������� + reduce_mean +x + + +var_1478 +axes + + +var_1479 + keep_dims + + +var_19' + variance_61 +  + +{ +*! +name + +" + variance_61S +const +var_1481 + * +name + + " +op_1481* +val +  + + + +�7�5s +add +x + + variance_61 +y + + +var_1481$ +var_1482 +  + +{ +* +name + + " +op_1482g +const +var_1483_epsilon_0 + *' +name + +" +op_1483_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1482! +epsilon + +var_1483_epsilon_0$ +var_1483 +  + +{ +* +name + + " +op_1483� +mul +x + +hidden_states_217 +y + + +var_1483. +hidden_states_221 +  + +{ +�*' +name + +" +hidden_states_221� +mul8 +x3 +1 +/model_decoder_block_5_layer_2_layer_norm_weight +y + +hidden_states_221& + input_269 +  + +{ +�* +name + + " + input_269� +linear +x + + input_269D +weight: +8 +6model_decoder_block_5_layer_2_DenseReluDense_wi_weight +bias + +input_17_bias_0& + input_271 +  + +{ +�* +name + + " + input_271c +relu +x + + input_271& + input_273 +  + +{ +�* +name + + " + input_273� +linear +x + + input_273D +weight: +8 +6model_decoder_block_5_layer_2_DenseReluDense_wo_weight +bias + +states_1_bias_0& + input_277 +  + +{ +�* +name + + " + input_277� +add +x + +hidden_states_217 +y + + input_277. +hidden_states_223 +  + +{ +�*' +name + +" +hidden_states_223g +const +var_13_promoted_31 + *' +name + +" +op_13_promoted_31* +val +  + + + +@� +pow +x + +hidden_states_223 +y + +var_13_promoted_31% +var_1501 +  + +{ +�* +name + + " +op_1501i +const +var_1502 + + +* +name + + " +op_1502*' +val  + + + + + +���������� + reduce_mean +x + + +var_1501 +axes + + +var_1502 + keep_dims + + +var_19$ +variance +  + +{ +* +name + + " + +varianceS +const +var_1504 + * +name + + " +op_1504* +val +  + + + +�7�5p +add +x + + +variance +y + + +var_1504$ +var_1505 +  + +{ +* +name + + " +op_1505g +const +var_1506_epsilon_0 + *' +name + +" +op_1506_epsilon_0* +val +  + + + +̼�+� +rsqrt +x + + +var_1505! +epsilon + +var_1506_epsilon_0$ +var_1506 +  + +{ +* +name + + " +op_1506� +mul +x + +hidden_states_223 +y + + +var_1506* + hidden_states +  + +{ +�*# +name + +" + hidden_states� +mul. +x) +' +%model_decoder_final_layer_norm_weight +y + + hidden_states. +last_hidden_state +  + +{ +�* +name + + " +input"� + buildInfo�" + + +~"| +8 +! + +" +coremltools-version + + " +7.0b1 +@ +) +! +" +coremltools-component-torch + + " +2.0.1 \ No newline at end of file