diff --git "a/coreml/text2text-generation/decoder_float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" "b/coreml/text2text-generation/decoder_float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" new file mode 100644--- /dev/null +++ "b/coreml/text2text-generation/decoder_float32_model.mlpackage/Data/com.apple.CoreML/model.mlmodel" @@ -0,0 +1,12914 @@ +� +\ +decoder_input_ids:Indices of decoder input sequence tokens in the vocabulary * +��� + +decoder_attention_maskXMask to avoid performing attention on padding token indices (1 = not masked, 0 = masked) * +��� +t +encoder_last_hidden_stateHSequence of hidden states at the output of the last layer of the encoder * +���� + +encoder_attention_maskXMask to avoid performing attention on padding token indices (1 = not masked, 0 = masked) * +���R@ +logits&Classification scores (before softmax)* +�؈���� +4sshleifer/distilbart-cnn-12-6 (text2text-generation)�3 +#com.github.apple.coremltools.source torch==2.0.1�+ +$com.github.apple.coremltools.version7.0�> +co.huggingface.exporters.namesshleifer/distilbart-cnn-12-6�5 +co.huggingface.exporters.tasktext2text-generation�E +%co.huggingface.exporters.architectureBartForConditionalGeneration�- +"co.huggingface.exporters.frameworkpytorch�- +"co.huggingface.exporters.precisionfloat32�" +transformers_version +4.7.0.dev0����� +main�� +( +decoder_input_ids + + +� +- +decoder_attention_mask + + +� +7 +encoder_last_hidden_state +  + +� +� +- +encoder_attention_mask + + +�CoreML5�� +CoreML5��logits� +const2 +model_model_shared_weight +  +؈ +�*/ +name' + +" +model_model_shared_weight*B +val; +  +؈ +�*" +@model_path/weights/weight.bin@� +const= +,model_model_decoder_layernorm_embedding_bias +   +�*B +name: +2 +0". +,model_model_decoder_layernorm_embedding_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���b� +const? +.model_model_decoder_layernorm_embedding_weight +   +�*D +name< +4 +2"0 +.model_model_decoder_layernorm_embedding_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���b� +constC +2model_model_decoder_layers_0_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_0_self_attn_q_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin�–b� +constL +4model_model_decoder_layers_0_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_0_self_attn_q_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��b� +constC +2model_model_decoder_layers_0_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_0_self_attn_k_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin��d� +constL +4model_model_decoder_layers_0_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_0_self_attn_k_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���d� +constC +2model_model_decoder_layers_0_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_0_self_attn_v_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���f� +constL +4model_model_decoder_layers_0_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_0_self_attn_v_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���f� +constE +4model_model_decoder_layers_0_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_0_self_attn_out_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���h� +constN +6model_model_decoder_layers_0_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_0_self_attn_out_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�ŗh� +constG +6model_model_decoder_layers_0_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_0_self_attn_layer_norm_bias*= +val6 +   +�*% +@model_path/weights/weight.bin�Ɨj� +constI +8model_model_decoder_layers_0_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_0_self_attn_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin��j� +constF +5model_model_decoder_layers_0_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_0_encoder_attn_q_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���j� +constO +7model_model_decoder_layers_0_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_0_encoder_attn_q_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���j� +constF +5model_model_decoder_layers_0_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_0_encoder_attn_k_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���l� +constO +7model_model_decoder_layers_0_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_0_encoder_attn_k_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin�Șl� +constF +5model_model_decoder_layers_0_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_0_encoder_attn_v_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin�ɘn� +constO +7model_model_decoder_layers_0_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_0_encoder_attn_v_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin��n� +constH +7model_model_decoder_layers_0_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_0_encoder_attn_out_proj_bias*= +val6 +   +�*% +@model_path/weights/weight.bin��p� +constQ +9model_model_decoder_layers_0_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_0_encoder_attn_out_proj_weight*D +val= +  +� +�*% +@model_path/weights/weight.bin���p� +constJ +9model_model_decoder_layers_0_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_0_encoder_attn_layer_norm_bias*= +val6 +   +�*% +@model_path/weights/weight.bin���r� +constL +;model_model_decoder_layers_0_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_0_encoder_attn_layer_norm_weight*= +val6 +   +�*% +@model_path/weights/weight.bin���r� +const6 +%model_model_decoder_layers_0_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_0_fc1_bias*= +val6 +   +� *% +@model_path/weights/weight.bin�̙r� +const? +'model_model_decoder_layers_0_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_0_fc1_weight*D +val= +  +�  +�*% +@model_path/weights/weight.bin�̚r� +const6 +%model_model_decoder_layers_0_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_0_fc2_bias*= +val6 +   +�*% +@model_path/weights/weight.bin�͚z� +const? +'model_model_decoder_layers_0_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_0_fc2_weight*D +val= +  +� +� *% +@model_path/weights/weight.bin��z� +constC +2model_model_decoder_layers_0_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_0_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�� +constE +4model_model_decoder_layers_0_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_0_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_1_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_1_self_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_1_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_1_self_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ϛ�� +constC +2model_model_decoder_layers_1_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_1_self_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�Л�� +constL +4model_model_decoder_layers_1_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_1_self_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin��� +constC +2model_model_decoder_layers_1_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_1_self_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin��� +constL +4model_model_decoder_layers_1_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_1_self_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constE +4model_model_decoder_layers_1_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_1_self_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constN +6model_model_decoder_layers_1_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_1_self_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constG +6model_model_decoder_layers_1_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_1_self_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constI +8model_model_decoder_layers_1_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_1_self_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin�Ӝ�� +constF +5model_model_decoder_layers_1_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_1_encoder_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_1_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_1_encoder_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_1_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_1_encoder_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_1_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_1_encoder_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_1_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_1_encoder_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_1_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_1_encoder_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�֝�� +constH +7model_model_decoder_layers_1_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_1_encoder_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ם�� +constQ +9model_model_decoder_layers_1_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_1_encoder_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constJ +9model_model_decoder_layers_1_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_1_encoder_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +;model_model_decoder_layers_1_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_1_encoder_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_1_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_1_fc1_bias*> +val7 +   +� *& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_1_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_1_fc1_weight*E +val> +  +�  +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_1_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_1_fc2_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_1_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_1_fc2_weight*E +val> +  +� +� *& +@model_path/weights/weight.bin�ڟ�� +constC +2model_model_decoder_layers_1_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_1_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�۟�� +constE +4model_model_decoder_layers_1_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_1_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_2_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_2_self_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_2_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_2_self_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_2_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_2_self_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_2_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_2_self_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ݠ�� +constC +2model_model_decoder_layers_2_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_2_self_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ޠ�� +constL +4model_model_decoder_layers_2_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_2_self_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constE +4model_model_decoder_layers_2_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_2_self_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constN +6model_model_decoder_layers_2_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_2_self_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constG +6model_model_decoder_layers_2_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_2_self_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constI +8model_model_decoder_layers_2_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_2_self_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_2_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_2_encoder_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ᡪ� +constO +7model_model_decoder_layers_2_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_2_encoder_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_2_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_2_encoder_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_2_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_2_encoder_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_2_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_2_encoder_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_2_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_2_encoder_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�â�� +constH +7model_model_decoder_layers_2_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_2_encoder_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�Ģ�� +constQ +9model_model_decoder_layers_2_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_2_encoder_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�䢰� +constJ +9model_model_decoder_layers_2_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_2_encoder_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�墲� +constL +;model_model_decoder_layers_2_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_2_encoder_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_2_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_2_fc1_bias*> +val7 +   +� *& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_2_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_2_fc1_weight*E +val> +  +�  +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_2_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_2_fc2_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_2_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_2_fc2_weight*E +val> +  +� +� *& +@model_path/weights/weight.bin�Ǥ�� +constC +2model_model_decoder_layers_2_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_2_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�Ȥ�� +constE +4model_model_decoder_layers_2_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_2_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin���� +constC +2model_model_decoder_layers_3_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_3_self_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_3_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_3_self_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_3_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_3_self_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_3_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_3_self_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ʥ�� +constC +2model_model_decoder_layers_3_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_3_self_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�˥�� +constL +4model_model_decoder_layers_3_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_3_self_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin���� +constE +4model_model_decoder_layers_3_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_3_self_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin���� +constN +6model_model_decoder_layers_3_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_3_self_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constG +6model_model_decoder_layers_3_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_3_self_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constI +8model_model_decoder_layers_3_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_3_self_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_3_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_3_encoder_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�Φ�� +constO +7model_model_decoder_layers_3_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_3_encoder_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin���� +constF +5model_model_decoder_layers_3_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_3_encoder_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin���� +constO +7model_model_decoder_layers_3_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_3_encoder_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_3_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_3_encoder_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_3_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_3_encoder_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constH +7model_model_decoder_layers_3_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_3_encoder_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constQ +9model_model_decoder_layers_3_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_3_encoder_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ѧ�� +constJ +9model_model_decoder_layers_3_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_3_encoder_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ҧ�� +constL +;model_model_decoder_layers_3_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_3_encoder_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin���� +const6 +%model_model_decoder_layers_3_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_3_fc1_bias*> +val7 +   +� *& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_3_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_3_fc1_weight*E +val> +  +�  +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_3_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_3_fc2_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_3_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_3_fc2_weight*E +val> +  +� +� *& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_3_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_3_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constE +4model_model_decoder_layers_3_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_3_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin�թ�� +constC +2model_model_decoder_layers_4_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_4_self_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_4_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_4_self_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_4_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_4_self_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_4_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_4_self_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_4_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_4_self_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_4_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_4_self_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ت�� +constE +4model_model_decoder_layers_4_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_4_self_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�٪�� +constN +6model_model_decoder_layers_4_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_4_self_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constG +6model_model_decoder_layers_4_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_4_self_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constI +8model_model_decoder_layers_4_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_4_self_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_4_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_4_encoder_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_4_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_4_encoder_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�۫�� +constF +5model_model_decoder_layers_4_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_4_encoder_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ܫ�� +constO +7model_model_decoder_layers_4_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_4_encoder_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_4_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_4_encoder_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_4_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_4_encoder_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constH +7model_model_decoder_layers_4_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_4_encoder_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constQ +9model_model_decoder_layers_4_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_4_encoder_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constJ +9model_model_decoder_layers_4_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_4_encoder_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +;model_model_decoder_layers_4_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_4_encoder_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin�߬�� +const6 +%model_model_decoder_layers_4_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_4_fc1_bias*> +val7 +   +� *& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_4_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_4_fc1_weight*E +val> +  +�  +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_4_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_4_fc2_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_4_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_4_fc2_weight*E +val> +  +� +� *& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_4_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_4_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constE +4model_model_decoder_layers_4_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_4_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin�®�� +constC +2model_model_decoder_layers_5_self_attn_q_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_5_self_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�㮂� +constL +4model_model_decoder_layers_5_self_attn_q_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_5_self_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_5_self_attn_k_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_5_self_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_5_self_attn_k_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_5_self_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_5_self_attn_v_proj_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_5_self_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +4model_model_decoder_layers_5_self_attn_v_proj_weight +  +� +�*J +nameB +: +8"6 +4model_model_decoder_layers_5_self_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�ů�� +constE +4model_model_decoder_layers_5_self_attn_out_proj_bias +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_5_self_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�Ư�� +constN +6model_model_decoder_layers_5_self_attn_out_proj_weight +  +� +�*L +nameD +< +:"8 +6model_model_decoder_layers_5_self_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�毈� +constG +6model_model_decoder_layers_5_self_attn_layer_norm_bias +   +�*L +nameD +< +:"8 +6model_model_decoder_layers_5_self_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�篊� +constI +8model_model_decoder_layers_5_self_attn_layer_norm_weight +   +�*N +nameF +> +<": +8model_model_decoder_layers_5_self_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constF +5model_model_decoder_layers_5_encoder_attn_q_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_5_encoder_attn_q_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constO +7model_model_decoder_layers_5_encoder_attn_q_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_5_encoder_attn_q_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�Ȱ�� +constF +5model_model_decoder_layers_5_encoder_attn_k_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_5_encoder_attn_k_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�ɰ�� +constO +7model_model_decoder_layers_5_encoder_attn_k_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_5_encoder_attn_k_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin�鰌� +constF +5model_model_decoder_layers_5_encoder_attn_v_proj_bias +   +�*K +nameC +; +9"7 +5model_model_decoder_layers_5_encoder_attn_v_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�갎� +constO +7model_model_decoder_layers_5_encoder_attn_v_proj_weight +  +� +�*M +nameE += +;"9 +7model_model_decoder_layers_5_encoder_attn_v_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constH +7model_model_decoder_layers_5_encoder_attn_out_proj_bias +   +�*M +nameE += +;"9 +7model_model_decoder_layers_5_encoder_attn_out_proj_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constQ +9model_model_decoder_layers_5_encoder_attn_out_proj_weight +  +� +�*O +nameG +? +="; +9model_model_decoder_layers_5_encoder_attn_out_proj_weight*E +val> +  +� +�*& +@model_path/weights/weight.bin����� +constJ +9model_model_decoder_layers_5_encoder_attn_layer_norm_bias +   +�*O +nameG +? +="; +9model_model_decoder_layers_5_encoder_attn_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constL +;model_model_decoder_layers_5_encoder_attn_layer_norm_weight +   +�*Q +nameI +A +?"= +;model_model_decoder_layers_5_encoder_attn_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin�̱�� +const6 +%model_model_decoder_layers_5_fc1_bias +   +� *; +name3 ++ +)"' +%model_model_decoder_layers_5_fc1_bias*> +val7 +   +� *& +@model_path/weights/weight.bin����� +const? +'model_model_decoder_layers_5_fc1_weight +  +�  +�*= +name5 +- ++") +'model_model_decoder_layers_5_fc1_weight*E +val> +  +�  +�*& +@model_path/weights/weight.bin����� +const6 +%model_model_decoder_layers_5_fc2_bias +   +�*; +name3 ++ +)"' +%model_model_decoder_layers_5_fc2_bias*> +val7 +   +�*& +@model_path/weights/weight.bin�� +const? +'model_model_decoder_layers_5_fc2_weight +  +� +� *= +name5 +- ++") +'model_model_decoder_layers_5_fc2_weight*E +val> +  +� +� *& +@model_path/weights/weight.bin����� +constC +2model_model_decoder_layers_5_final_layer_norm_bias +   +�*H +name@ +8 +6"4 +2model_model_decoder_layers_5_final_layer_norm_bias*> +val7 +   +�*& +@model_path/weights/weight.bin����� +constE +4model_model_decoder_layers_5_final_layer_norm_weight +   +�*J +nameB +: +8"6 +4model_model_decoder_layers_5_final_layer_norm_weight*> +val7 +   +�*& +@model_path/weights/weight.bin����O +const +var_12 + * +name + + " +op_12* +val +  + + + +��'7O +const +var_16 + * +name + + " +op_16* +val +  + + + +�?U +const +var_21 +* +name + + " +op_21* +val + + + +���������O +const +var_24 + * +name + + " +op_24* +val +  + + + +���Z +const + var_51_axis_0 +*" +name + +" + op_51_axis_0* +val + + +� +gather" +x + +model_model_shared_weight +indices + +decoder_input_ids +axis + + var_51_axis_0$ +var_51 +  + +� +�* +name + + " +op_51� +const* +var_67 +  + + +� +�* +name + + " +op_67*Q +valJ +  + + +� +�*& +@model_path/weights/weight.bin�г�j +const + var_78_axes_0 + + +*" +name + +" + op_78_axes_0* +val + + + + +� + expand_dims +x + +decoder_attention_mask +axes + + var_78_axes_0# +var_78 + + + +�* +name + + " +op_78j +const + var_79_axes_0 + + +*" +name + +" + op_79_axes_0* +val + + + + +� + expand_dims +x + + +var_78 +axes + + var_79_axes_0) +var_79 + + + + +�* +name + + " +op_79n +const + var_82_reps_0 + + +*" +name + +" + op_82_reps_0*" +val + + + +  +�{ +tile +x + + +var_79 +reps + + var_82_reps_0* +var_82 + + + +� +�* +name + + " +op_82_ +const +var_83_dtype_0 +*# +name + +" + op_83_dtype_0* +val + + +" +fp32� +cast +x + + +var_82 +dtype + +var_83_dtype_0, +cast_127 +  + + +� +�* +name + + " + +cast_127� +sub +x + + +var_16 +y + + +cast_1273 +inverted_mask_1 +  + + +� +�*% +name + +" +inverted_mask_1_ +const +var_85_dtype_0 +*# +name + +" + op_85_dtype_0* +val + + +" +bool� +cast +x + +inverted_mask_1 +dtype + +var_85_dtype_0, +cast_126 + + + +� +�* +name + + " + +cast_126� +select +cond + + +cast_126 +a + + +var_24 +b + +inverted_mask_1* +var_86 +  + + +� +�* +name + + " +op_86� +add +x + + +var_86 +y + + +var_674 +attention_mask_1 +  + + +� +�*& +name + +" +attention_mask_1j +const + var_92_axes_0 + + +*" +name + +" + op_92_axes_0* +val + + + + +� + expand_dims +x + +encoder_attention_mask +axes + + var_92_axes_0# +var_92 + + + +�* +name + + " +op_92j +const + var_93_axes_0 + + +*" +name + +" + op_93_axes_0* +val + + + + +� + expand_dims +x + + +var_92 +axes + + var_93_axes_0) +var_93 + + + + +�* +name + + " +op_93n +const + var_96_reps_0 + + +*" +name + +" + op_96_reps_0*" +val + + + +  +�{ +tile +x + + +var_93 +reps + + var_96_reps_0* +var_96 + + + +� +�* +name + + " +op_96_ +const +var_97_dtype_0 +*# +name + +" + op_97_dtype_0* +val + + +" +fp32� +cast +x + + +var_96 +dtype + +var_97_dtype_0, +cast_125 +  + + +� +�* +name + + " + +cast_125� +sub +x + + +var_16 +y + + +cast_1251 + inverted_mask +  + + +� +�*# +name + +" + inverted_mask_ +const +var_99_dtype_0 +*# +name + +" + op_99_dtype_0* +val + + +" +bool� +cast +x + + inverted_mask +dtype + +var_99_dtype_0, +cast_124 + + + +� +�* +name + + " + +cast_124� +select +cond + + +cast_124 +a + + +var_24 +b + + inverted_mask2 +attention_mask +  + + +� +�*$ +name + +" +attention_mask� +const' + positions +  + +� +�* +name + + " + positions*K +valD +  + +� +�*& +@model_path/weights/weight.bin�з�p +add +x + + +var_51 +y + + positions% +input_3 +  + +� +�* +name + + " +input_3v +const +input_5_axes_0 + + +*$ +name + +" +input_5_axes_0*' +val  + + + + + +���������� + +layer_norm +x + +input_3 +axes + +input_5_axes_0; +gamma2 +0 +.model_model_decoder_layernorm_embedding_weight8 +beta0 +. +,model_model_decoder_layernorm_embedding_bias +epsilon + + +var_12% +input_5 +  + +� +�* +name + + " +input_5� +linear +x + +input_5B +weight8 +6 +4model_model_decoder_layers_0_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_0_self_attn_q_proj_bias& +linear_0 +  + +� +�* +name + + " + +linear_0Q +const +var_138 + * +name + + +" +op_138* +val +  + + + +>r +mul +x + + +linear_0 +y + +var_138& +tensor_5 +  + +� +�* +name + + " + +tensor_5� +linear +x + +input_5B +weight8 +6 +4model_model_decoder_layers_0_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_0_self_attn_k_proj_bias& +linear_1 +  + +� +�* +name + + " + +linear_1j +const +var_143 + + +* +name + + +" +op_143** +val# + + + + + ���������@| +reshape +x + + +linear_1 +shape + +var_143* +var_144 +  + +� + +@* +name + + +" +op_144o +const +var_145_perm_0 + + +*# +name + +" + op_145_perm_0*! +val + + + + + +� +linear +x + +input_5B +weight8 +6 +4model_model_decoder_layers_0_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_0_self_attn_v_proj_bias& +linear_2 +  + +� +�* +name + + " + +linear_2j +const +var_150 + + +* +name + + +" +op_150** +val# + + + + + ���������@| +reshape +x + + +linear_2 +shape + +var_150* +var_151 +  + +� + +@* +name + + +" +op_151o +const +var_152_perm_0 + + +*# +name + +" + op_152_perm_0*! +val + + + + + +b +const +var_159 + + +* +name + + +" +op_159*" +val + + + +  +�@| +reshape +x + + +tensor_5 +shape + +var_159* +var_160 +  + +� + +@* +name + + +" +op_160o +const +var_161_perm_0 + + +*# +name + +" + op_161_perm_0*! +val + + + + + +i +const +var_163 + + +* +name + + +" +op_163*) +val" + + + + + ���������@� + transpose +x + +var_160 +perm + +var_161_perm_0/ + transpose_57 +  + + +� +@*" +name + +" + transpose_57� +reshape +x + + transpose_57 +shape + +var_163+ +query_states_1 +  + +� +@*$ +name + +" +query_states_1i +const +var_165 + + +* +name + + +" +op_165*) +val" + + + + + ���������@� + transpose +x + +var_144 +perm + +var_145_perm_0/ + transpose_59 +  + + +� +@*" +name + +" + transpose_59� +reshape +x + + transpose_59 +shape + +var_165) + key_states_3 +  + +� +@*" +name + +" + key_states_3i +const +var_167 + + +* +name + + +" +op_167*) +val" + + + + + ���������@� + transpose +x + +var_151 +perm + +var_152_perm_0/ + transpose_58 +  + + +� +@*" +name + +" + transpose_58� +reshape +x + + transpose_58 +shape + +var_167+ +value_states_3 +  + +� +@*$ +name + +" +value_states_3n +const +var_170_perm_0 + + +*# +name + +" + op_170_perm_0* +val + + + + +y +const$ +attn_weights_1_transpose_x_0 +*2 +name* +" + " +attn_weights_1_transpose_x_0* +val + + +y +const$ +attn_weights_1_transpose_y_0 +*2 +name* +" + " +attn_weights_1_transpose_y_0* +val + + +� + transpose +x + + key_states_3 +perm + +var_170_perm_0) + transpose_56 +  + +@ +�*" +name + +" + transpose_56� +matmul +x + +query_states_1 +y + + transpose_56/ + transpose_x + +attn_weights_1_transpose_x_0/ + transpose_y + +attn_weights_1_transpose_y_0, +attn_weights_1 +  + +� +�*$ +name + +" +attn_weights_1c +const +var_172 + + +* +name + + +" +op_172*# +val + + + + + +��� +reshape +x + +attn_weights_1 +shape + +var_172+ +var_173 +  + + +� +�* +name + + +" +op_173� +add +x + +var_173 +y + +attention_mask_12 +attn_weights_3 +  + + +� +�*$ +name + +" +attn_weights_3b +const +var_178 + + +* +name + + +" +op_178*" +val + + + +  +��~ +reshape +x + +attn_weights_3 +shape + +var_178% +input_7 +  + +� +�* +name + + " +input_7u +softmax +x + +input_7 +axis + + +var_21% +input_9 +  + +� +�* +name + + " +input_9w +const# +attn_output_1_transpose_x_0 +*1 +name) +! +" +attn_output_1_transpose_x_0* +val + + +w +const# +attn_output_1_transpose_y_0 +*1 +name) +! +" +attn_output_1_transpose_y_0* +val + + +� +matmul +x + +input_9 +y + +value_states_3. + transpose_x + +attn_output_1_transpose_x_0. + transpose_y + +attn_output_1_transpose_y_0* + attn_output_1 +  + +� +@*# +name + +" + attn_output_1b +const +var_183 + + +* +name + + +" +op_183*" +val + + + +  +�@� +reshape +x + + attn_output_1 +shape + +var_1830 + attn_output_3 +  + + +� +@*# +name + +" + attn_output_3| +const$ +attn_output_5_perm_0 + + +** +name" + +" +attn_output_5_perm_0*! +val + + + + + +b +const +var_186 + + +* +name + + +" +op_186*" +val + + + +  +��� + transpose +x + + attn_output_3 +perm + +attn_output_5_perm_0/ + transpose_55 +  + +� + +@*" +name + +" + transpose_55~ +reshape +x + + transpose_55 +shape + +var_186& +input_11 +  + +� +�* +name + + " + +input_11� +linear +x + + +input_11D +weight: +8 +6model_model_decoder_layers_0_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_0_self_attn_out_proj_bias& +linear_3 +  + +� +�* +name + + " + +linear_3r +add +x + +input_5 +y + + +linear_3& +input_15 +  + +� +�* +name + + " + +input_15� +const& +hidden_states_5_axes_0 + + +*, +name$ + +" +hidden_states_5_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_15" +axes + +hidden_states_5_axes_0E +gamma< +: +8model_model_decoder_layers_0_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_0_self_attn_layer_norm_bias +epsilon + + +var_12- +hidden_states_5 +  + +� +�*% +name + +" +hidden_states_5� +linear +x + +hidden_states_5E +weight; +9 +7model_model_decoder_layers_0_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_0_encoder_attn_q_proj_bias& +linear_4 +  + +� +�* +name + + " + +linear_4Q +const +var_207 + * +name + + +" +op_207* +val +  + + + +>t +mul +x + + +linear_4 +y + +var_207' + tensor_11 +  + +� +�* +name + + " + tensor_11� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_0_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_0_encoder_attn_k_proj_bias& +linear_5 +  + +� +�* +name + + " + +linear_5j +const +var_212 + + +* +name + + +" +op_212** +val# + + + + + ���������@| +reshape +x + + +linear_5 +shape + +var_212* +var_213 +  + +� + +@* +name + + +" +op_213o +const +var_214_perm_0 + + +*# +name + +" + op_214_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_0_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_0_encoder_attn_v_proj_bias& +linear_6 +  + +� +�* +name + + " + +linear_6j +const +var_219 + + +* +name + + +" +op_219** +val# + + + + + ���������@| +reshape +x + + +linear_6 +shape + +var_219* +var_220 +  + +� + +@* +name + + +" +op_220o +const +var_221_perm_0 + + +*# +name + +" + op_221_perm_0*! +val + + + + + +b +const +var_228 + + +* +name + + +" +op_228*" +val + + + +  +�@} +reshape +x + + tensor_11 +shape + +var_228* +var_229 +  + +� + +@* +name + + +" +op_229o +const +var_230_perm_0 + + +*# +name + +" + op_230_perm_0*! +val + + + + + +i +const +var_232 + + +* +name + + +" +op_232*) +val" + + + + + ���������@� + transpose +x + +var_229 +perm + +var_230_perm_0/ + transpose_52 +  + + +� +@*" +name + +" + transpose_52� +reshape +x + + transpose_52 +shape + +var_232+ +query_states_3 +  + +� +@*$ +name + +" +query_states_3i +const +var_234 + + +* +name + + +" +op_234*) +val" + + + + + ���������@� + transpose +x + +var_213 +perm + +var_214_perm_0/ + transpose_54 +  + + +� +@*" +name + +" + transpose_54� +reshape +x + + transpose_54 +shape + +var_234) + key_states_7 +  + +� +@*" +name + +" + key_states_7i +const +var_236 + + +* +name + + +" +op_236*) +val" + + + + + ���������@� + transpose +x + +var_220 +perm + +var_221_perm_0/ + transpose_53 +  + + +� +@*" +name + +" + transpose_53� +reshape +x + + transpose_53 +shape + +var_236+ +value_states_7 +  + +� +@*$ +name + +" +value_states_7n +const +var_239_perm_0 + + +*# +name + +" + op_239_perm_0* +val + + + + +y +const$ +attn_weights_7_transpose_x_0 +*2 +name* +" + " +attn_weights_7_transpose_x_0* +val + + +y +const$ +attn_weights_7_transpose_y_0 +*2 +name* +" + " +attn_weights_7_transpose_y_0* +val + + +� + transpose +x + + key_states_7 +perm + +var_239_perm_0) + transpose_51 +  + +@ +�*" +name + +" + transpose_51� +matmul +x + +query_states_3 +y + + transpose_51/ + transpose_x + +attn_weights_7_transpose_x_0/ + transpose_y + +attn_weights_7_transpose_y_0, +attn_weights_7 +  + +� +�*$ +name + +" +attn_weights_7c +const +var_241 + + +* +name + + +" +op_241*# +val + + + + + +��� +reshape +x + +attn_weights_7 +shape + +var_241+ +var_242 +  + + +� +�* +name + + +" +op_242� +add +x + +var_242 +y + +attention_mask2 +attn_weights_9 +  + + +� +�*$ +name + +" +attn_weights_9b +const +var_247 + + +* +name + + +" +op_247*" +val + + + +  +��� +reshape +x + +attn_weights_9 +shape + +var_247& +input_19 +  + +� +�* +name + + " + +input_19x +softmax +x + + +input_19 +axis + + +var_21& +input_21 +  + +� +�* +name + + " + +input_21w +const# +attn_output_7_transpose_x_0 +*1 +name) +! +" +attn_output_7_transpose_x_0* +val + + +w +const# +attn_output_7_transpose_y_0 +*1 +name) +! +" +attn_output_7_transpose_y_0* +val + + +� +matmul +x + + +input_21 +y + +value_states_7. + transpose_x + +attn_output_7_transpose_x_0. + transpose_y + +attn_output_7_transpose_y_0* + attn_output_7 +  + +� +@*# +name + +" + attn_output_7b +const +var_252 + + +* +name + + +" +op_252*" +val + + + +  +�@� +reshape +x + + attn_output_7 +shape + +var_2520 + attn_output_9 +  + + +� +@*# +name + +" + attn_output_9~ +const% +attn_output_11_perm_0 + + +*+ +name# + +" +attn_output_11_perm_0*! +val + + + + + +b +const +var_255 + + +* +name + + +" +op_255*" +val + + + +  +��� + transpose +x + + attn_output_9! +perm + +attn_output_11_perm_0/ + transpose_50 +  + +� + +@*" +name + +" + transpose_50~ +reshape +x + + transpose_50 +shape + +var_255& +input_23 +  + +� +�* +name + + " + +input_23� +linear +x + + +input_23G +weight= +; +9model_model_decoder_layers_0_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_0_encoder_attn_out_proj_bias& +linear_7 +  + +� +�* +name + + " + +linear_7z +add +x + +hidden_states_5 +y + + +linear_7& +input_27 +  + +� +�* +name + + " + +input_27x +const +input_29_axes_0 + + +*% +name + +" +input_29_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_27 +axes + +input_29_axes_0H +gamma? += +;model_model_decoder_layers_0_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_0_encoder_attn_layer_norm_bias +epsilon + + +var_12& +input_29 +  + +� +�* +name + + " + +input_29� +linear +x + + +input_295 +weight+ +) +'model_model_decoder_layers_0_fc1_weight1 +bias) +' +%model_model_decoder_layers_0_fc1_bias& +linear_8 +  + +� +� * +name + + " + +linear_8c +const +input_33_mode_0 +*% +name + +" +input_33_mode_0* +val + + " +EXACT~ +gelu +x + + +linear_8 +mode + +input_33_mode_0& +input_33 +  + +� +� * +name + + " + +input_33� +linear +x + + +input_335 +weight+ +) +'model_model_decoder_layers_0_fc2_weight1 +bias) +' +%model_model_decoder_layers_0_fc2_bias& +linear_9 +  + +� +�* +name + + " + +linear_9s +add +x + + +input_29 +y + + +linear_9& +input_39 +  + +� +�* +name + + " + +input_39� +const' +hidden_states_11_axes_0 + + +*- +name% + +" +hidden_states_11_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_39# +axes + +hidden_states_11_axes_0A +gamma8 +6 +4model_model_decoder_layers_0_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_0_final_layer_norm_bias +epsilon + + +var_12. +hidden_states_11 +  + +� +�*& +name + +" +hidden_states_11� +linear +x + +hidden_states_11B +weight8 +6 +4model_model_decoder_layers_1_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_1_self_attn_q_proj_bias' + linear_10 +  + +� +�* +name + + " + linear_10Q +const +var_297 + * +name + + +" +op_297* +val +  + + + +>u +mul +x + + linear_10 +y + +var_297' + tensor_17 +  + +� +�* +name + + " + tensor_17� +linear +x + +hidden_states_11B +weight8 +6 +4model_model_decoder_layers_1_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_1_self_attn_k_proj_bias' + linear_11 +  + +� +�* +name + + " + linear_11j +const +var_302 + + +* +name + + +" +op_302** +val# + + + + + ���������@} +reshape +x + + linear_11 +shape + +var_302* +var_303 +  + +� + +@* +name + + +" +op_303o +const +var_304_perm_0 + + +*# +name + +" + op_304_perm_0*! +val + + + + + +� +linear +x + +hidden_states_11B +weight8 +6 +4model_model_decoder_layers_1_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_1_self_attn_v_proj_bias' + linear_12 +  + +� +�* +name + + " + linear_12j +const +var_309 + + +* +name + + +" +op_309** +val# + + + + + ���������@} +reshape +x + + linear_12 +shape + +var_309* +var_310 +  + +� + +@* +name + + +" +op_310o +const +var_311_perm_0 + + +*# +name + +" + op_311_perm_0*! +val + + + + + +b +const +var_318 + + +* +name + + +" +op_318*" +val + + + +  +�@} +reshape +x + + tensor_17 +shape + +var_318* +var_319 +  + +� + +@* +name + + +" +op_319o +const +var_320_perm_0 + + +*# +name + +" + op_320_perm_0*! +val + + + + + +i +const +var_322 + + +* +name + + +" +op_322*) +val" + + + + + ���������@� + transpose +x + +var_319 +perm + +var_320_perm_0/ + transpose_47 +  + + +� +@*" +name + +" + transpose_47� +reshape +x + + transpose_47 +shape + +var_322+ +query_states_5 +  + +� +@*$ +name + +" +query_states_5i +const +var_324 + + +* +name + + +" +op_324*) +val" + + + + + ���������@� + transpose +x + +var_303 +perm + +var_304_perm_0/ + transpose_49 +  + + +� +@*" +name + +" + transpose_49� +reshape +x + + transpose_49 +shape + +var_324* + key_states_11 +  + +� +@*# +name + +" + key_states_11i +const +var_326 + + +* +name + + +" +op_326*) +val" + + + + + ���������@� + transpose +x + +var_310 +perm + +var_311_perm_0/ + transpose_48 +  + + +� +@*" +name + +" + transpose_48� +reshape +x + + transpose_48 +shape + +var_326, +value_states_11 +  + +� +@*% +name + +" +value_states_11n +const +var_329_perm_0 + + +*# +name + +" + op_329_perm_0* +val + + + + +{ +const% +attn_weights_13_transpose_x_0 +*3 +name+ +# +!" +attn_weights_13_transpose_x_0* +val + + +{ +const% +attn_weights_13_transpose_y_0 +*3 +name+ +# +!" +attn_weights_13_transpose_y_0* +val + + +� + transpose +x + + key_states_11 +perm + +var_329_perm_0) + transpose_46 +  + +@ +�*" +name + +" + transpose_46� +matmul +x + +query_states_5 +y + + transpose_460 + transpose_x! + +attn_weights_13_transpose_x_00 + transpose_y! + +attn_weights_13_transpose_y_0- +attn_weights_13 +  + +� +�*% +name + +" +attn_weights_13c +const +var_331 + + +* +name + + +" +op_331*# +val + + + + + +��� +reshape +x + +attn_weights_13 +shape + +var_331+ +var_332 +  + + +� +�* +name + + +" +op_332� +add +x + +var_332 +y + +attention_mask_13 +attn_weights_15 +  + + +� +�*% +name + +" +attn_weights_15b +const +var_337 + + +* +name + + +" +op_337*" +val + + + +  +��� +reshape +x + +attn_weights_15 +shape + +var_337& +input_41 +  + +� +�* +name + + " + +input_41x +softmax +x + + +input_41 +axis + + +var_21& +input_43 +  + +� +�* +name + + " + +input_43y +const$ +attn_output_13_transpose_x_0 +*2 +name* +" + " +attn_output_13_transpose_x_0* +val + + +y +const$ +attn_output_13_transpose_y_0 +*2 +name* +" + " +attn_output_13_transpose_y_0* +val + + +� +matmul +x + + +input_43 +y + +value_states_11/ + transpose_x + +attn_output_13_transpose_x_0/ + transpose_y + +attn_output_13_transpose_y_0+ +attn_output_13 +  + +� +@*$ +name + +" +attn_output_13b +const +var_342 + + +* +name + + +" +op_342*" +val + + + +  +�@� +reshape +x + +attn_output_13 +shape + +var_3421 +attn_output_15 +  + + +� +@*$ +name + +" +attn_output_15~ +const% +attn_output_17_perm_0 + + +*+ +name# + +" +attn_output_17_perm_0*! +val + + + + + +b +const +var_345 + + +* +name + + +" +op_345*" +val + + + +  +��� + transpose +x + +attn_output_15! +perm + +attn_output_17_perm_0/ + transpose_45 +  + +� + +@*" +name + +" + transpose_45~ +reshape +x + + transpose_45 +shape + +var_345& +input_45 +  + +� +�* +name + + " + +input_45� +linear +x + + +input_45D +weight: +8 +6model_model_decoder_layers_1_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_1_self_attn_out_proj_bias' + linear_13 +  + +� +�* +name + + " + linear_13| +add +x + +hidden_states_11 +y + + linear_13& +input_49 +  + +� +�* +name + + " + +input_49� +const' +hidden_states_15_axes_0 + + +*- +name% + +" +hidden_states_15_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_49# +axes + +hidden_states_15_axes_0E +gamma< +: +8model_model_decoder_layers_1_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_1_self_attn_layer_norm_bias +epsilon + + +var_12. +hidden_states_15 +  + +� +�*& +name + +" +hidden_states_15� +linear +x + +hidden_states_15E +weight; +9 +7model_model_decoder_layers_1_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_1_encoder_attn_q_proj_bias' + linear_14 +  + +� +�* +name + + " + linear_14Q +const +var_366 + * +name + + +" +op_366* +val +  + + + +>u +mul +x + + linear_14 +y + +var_366' + tensor_23 +  + +� +�* +name + + " + tensor_23� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_1_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_1_encoder_attn_k_proj_bias' + linear_15 +  + +� +�* +name + + " + linear_15j +const +var_371 + + +* +name + + +" +op_371** +val# + + + + + ���������@} +reshape +x + + linear_15 +shape + +var_371* +var_372 +  + +� + +@* +name + + +" +op_372o +const +var_373_perm_0 + + +*# +name + +" + op_373_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_1_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_1_encoder_attn_v_proj_bias' + linear_16 +  + +� +�* +name + + " + linear_16j +const +var_378 + + +* +name + + +" +op_378** +val# + + + + + ���������@} +reshape +x + + linear_16 +shape + +var_378* +var_379 +  + +� + +@* +name + + +" +op_379o +const +var_380_perm_0 + + +*# +name + +" + op_380_perm_0*! +val + + + + + +b +const +var_387 + + +* +name + + +" +op_387*" +val + + + +  +�@} +reshape +x + + tensor_23 +shape + +var_387* +var_388 +  + +� + +@* +name + + +" +op_388o +const +var_389_perm_0 + + +*# +name + +" + op_389_perm_0*! +val + + + + + +i +const +var_391 + + +* +name + + +" +op_391*) +val" + + + + + ���������@� + transpose +x + +var_388 +perm + +var_389_perm_0/ + transpose_42 +  + + +� +@*" +name + +" + transpose_42� +reshape +x + + transpose_42 +shape + +var_391+ +query_states_7 +  + +� +@*$ +name + +" +query_states_7i +const +var_393 + + +* +name + + +" +op_393*) +val" + + + + + ���������@� + transpose +x + +var_372 +perm + +var_373_perm_0/ + transpose_44 +  + + +� +@*" +name + +" + transpose_44� +reshape +x + + transpose_44 +shape + +var_393* + key_states_15 +  + +� +@*# +name + +" + key_states_15i +const +var_395 + + +* +name + + +" +op_395*) +val" + + + + + ���������@� + transpose +x + +var_379 +perm + +var_380_perm_0/ + transpose_43 +  + + +� +@*" +name + +" + transpose_43� +reshape +x + + transpose_43 +shape + +var_395, +value_states_15 +  + +� +@*% +name + +" +value_states_15n +const +var_398_perm_0 + + +*# +name + +" + op_398_perm_0* +val + + + + +{ +const% +attn_weights_19_transpose_x_0 +*3 +name+ +# +!" +attn_weights_19_transpose_x_0* +val + + +{ +const% +attn_weights_19_transpose_y_0 +*3 +name+ +# +!" +attn_weights_19_transpose_y_0* +val + + +� + transpose +x + + key_states_15 +perm + +var_398_perm_0) + transpose_41 +  + +@ +�*" +name + +" + transpose_41� +matmul +x + +query_states_7 +y + + transpose_410 + transpose_x! + +attn_weights_19_transpose_x_00 + transpose_y! + +attn_weights_19_transpose_y_0- +attn_weights_19 +  + +� +�*% +name + +" +attn_weights_19c +const +var_400 + + +* +name + + +" +op_400*# +val + + + + + +��� +reshape +x + +attn_weights_19 +shape + +var_400+ +var_401 +  + + +� +�* +name + + +" +op_401� +add +x + +var_401 +y + +attention_mask3 +attn_weights_21 +  + + +� +�*% +name + +" +attn_weights_21b +const +var_406 + + +* +name + + +" +op_406*" +val + + + +  +��� +reshape +x + +attn_weights_21 +shape + +var_406& +input_51 +  + +� +�* +name + + " + +input_51x +softmax +x + + +input_51 +axis + + +var_21& +input_53 +  + +� +�* +name + + " + +input_53y +const$ +attn_output_19_transpose_x_0 +*2 +name* +" + " +attn_output_19_transpose_x_0* +val + + +y +const$ +attn_output_19_transpose_y_0 +*2 +name* +" + " +attn_output_19_transpose_y_0* +val + + +� +matmul +x + + +input_53 +y + +value_states_15/ + transpose_x + +attn_output_19_transpose_x_0/ + transpose_y + +attn_output_19_transpose_y_0+ +attn_output_19 +  + +� +@*$ +name + +" +attn_output_19b +const +var_411 + + +* +name + + +" +op_411*" +val + + + +  +�@� +reshape +x + +attn_output_19 +shape + +var_4111 +attn_output_21 +  + + +� +@*$ +name + +" +attn_output_21~ +const% +attn_output_23_perm_0 + + +*+ +name# + +" +attn_output_23_perm_0*! +val + + + + + +b +const +var_414 + + +* +name + + +" +op_414*" +val + + + +  +��� + transpose +x + +attn_output_21! +perm + +attn_output_23_perm_0/ + transpose_40 +  + +� + +@*" +name + +" + transpose_40~ +reshape +x + + transpose_40 +shape + +var_414& +input_55 +  + +� +�* +name + + " + +input_55� +linear +x + + +input_55G +weight= +; +9model_model_decoder_layers_1_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_1_encoder_attn_out_proj_bias' + linear_17 +  + +� +�* +name + + " + linear_17| +add +x + +hidden_states_15 +y + + linear_17& +input_59 +  + +� +�* +name + + " + +input_59x +const +input_61_axes_0 + + +*% +name + +" +input_61_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_59 +axes + +input_61_axes_0H +gamma? += +;model_model_decoder_layers_1_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_1_encoder_attn_layer_norm_bias +epsilon + + +var_12& +input_61 +  + +� +�* +name + + " + +input_61� +linear +x + + +input_615 +weight+ +) +'model_model_decoder_layers_1_fc1_weight1 +bias) +' +%model_model_decoder_layers_1_fc1_bias' + linear_18 +  + +� +� * +name + + " + linear_18c +const +input_65_mode_0 +*% +name + +" +input_65_mode_0* +val + + " +EXACT +gelu +x + + linear_18 +mode + +input_65_mode_0& +input_65 +  + +� +� * +name + + " + +input_65� +linear +x + + +input_655 +weight+ +) +'model_model_decoder_layers_1_fc2_weight1 +bias) +' +%model_model_decoder_layers_1_fc2_bias' + linear_19 +  + +� +�* +name + + " + linear_19t +add +x + + +input_61 +y + + linear_19& +input_71 +  + +� +�* +name + + " + +input_71� +const' +hidden_states_21_axes_0 + + +*- +name% + +" +hidden_states_21_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_71# +axes + +hidden_states_21_axes_0A +gamma8 +6 +4model_model_decoder_layers_1_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_1_final_layer_norm_bias +epsilon + + +var_12. +hidden_states_21 +  + +� +�*& +name + +" +hidden_states_21� +linear +x + +hidden_states_21B +weight8 +6 +4model_model_decoder_layers_2_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_2_self_attn_q_proj_bias' + linear_20 +  + +� +�* +name + + " + linear_20Q +const +var_456 + * +name + + +" +op_456* +val +  + + + +>u +mul +x + + linear_20 +y + +var_456' + tensor_29 +  + +� +�* +name + + " + tensor_29� +linear +x + +hidden_states_21B +weight8 +6 +4model_model_decoder_layers_2_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_2_self_attn_k_proj_bias' + linear_21 +  + +� +�* +name + + " + linear_21j +const +var_461 + + +* +name + + +" +op_461** +val# + + + + + ���������@} +reshape +x + + linear_21 +shape + +var_461* +var_462 +  + +� + +@* +name + + +" +op_462o +const +var_463_perm_0 + + +*# +name + +" + op_463_perm_0*! +val + + + + + +� +linear +x + +hidden_states_21B +weight8 +6 +4model_model_decoder_layers_2_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_2_self_attn_v_proj_bias' + linear_22 +  + +� +�* +name + + " + linear_22j +const +var_468 + + +* +name + + +" +op_468** +val# + + + + + ���������@} +reshape +x + + linear_22 +shape + +var_468* +var_469 +  + +� + +@* +name + + +" +op_469o +const +var_470_perm_0 + + +*# +name + +" + op_470_perm_0*! +val + + + + + +b +const +var_477 + + +* +name + + +" +op_477*" +val + + + +  +�@} +reshape +x + + tensor_29 +shape + +var_477* +var_478 +  + +� + +@* +name + + +" +op_478o +const +var_479_perm_0 + + +*# +name + +" + op_479_perm_0*! +val + + + + + +i +const +var_481 + + +* +name + + +" +op_481*) +val" + + + + + ���������@� + transpose +x + +var_478 +perm + +var_479_perm_0/ + transpose_37 +  + + +� +@*" +name + +" + transpose_37� +reshape +x + + transpose_37 +shape + +var_481+ +query_states_9 +  + +� +@*$ +name + +" +query_states_9i +const +var_483 + + +* +name + + +" +op_483*) +val" + + + + + ���������@� + transpose +x + +var_462 +perm + +var_463_perm_0/ + transpose_39 +  + + +� +@*" +name + +" + transpose_39� +reshape +x + + transpose_39 +shape + +var_483* + key_states_19 +  + +� +@*# +name + +" + key_states_19i +const +var_485 + + +* +name + + +" +op_485*) +val" + + + + + ���������@� + transpose +x + +var_469 +perm + +var_470_perm_0/ + transpose_38 +  + + +� +@*" +name + +" + transpose_38� +reshape +x + + transpose_38 +shape + +var_485, +value_states_19 +  + +� +@*% +name + +" +value_states_19n +const +var_488_perm_0 + + +*# +name + +" + op_488_perm_0* +val + + + + +{ +const% +attn_weights_25_transpose_x_0 +*3 +name+ +# +!" +attn_weights_25_transpose_x_0* +val + + +{ +const% +attn_weights_25_transpose_y_0 +*3 +name+ +# +!" +attn_weights_25_transpose_y_0* +val + + +� + transpose +x + + key_states_19 +perm + +var_488_perm_0) + transpose_36 +  + +@ +�*" +name + +" + transpose_36� +matmul +x + +query_states_9 +y + + transpose_360 + transpose_x! + +attn_weights_25_transpose_x_00 + transpose_y! + +attn_weights_25_transpose_y_0- +attn_weights_25 +  + +� +�*% +name + +" +attn_weights_25c +const +var_490 + + +* +name + + +" +op_490*# +val + + + + + +��� +reshape +x + +attn_weights_25 +shape + +var_490+ +var_491 +  + + +� +�* +name + + +" +op_491� +add +x + +var_491 +y + +attention_mask_13 +attn_weights_27 +  + + +� +�*% +name + +" +attn_weights_27b +const +var_496 + + +* +name + + +" +op_496*" +val + + + +  +��� +reshape +x + +attn_weights_27 +shape + +var_496& +input_73 +  + +� +�* +name + + " + +input_73x +softmax +x + + +input_73 +axis + + +var_21& +input_75 +  + +� +�* +name + + " + +input_75y +const$ +attn_output_25_transpose_x_0 +*2 +name* +" + " +attn_output_25_transpose_x_0* +val + + +y +const$ +attn_output_25_transpose_y_0 +*2 +name* +" + " +attn_output_25_transpose_y_0* +val + + +� +matmul +x + + +input_75 +y + +value_states_19/ + transpose_x + +attn_output_25_transpose_x_0/ + transpose_y + +attn_output_25_transpose_y_0+ +attn_output_25 +  + +� +@*$ +name + +" +attn_output_25b +const +var_501 + + +* +name + + +" +op_501*" +val + + + +  +�@� +reshape +x + +attn_output_25 +shape + +var_5011 +attn_output_27 +  + + +� +@*$ +name + +" +attn_output_27~ +const% +attn_output_29_perm_0 + + +*+ +name# + +" +attn_output_29_perm_0*! +val + + + + + +b +const +var_504 + + +* +name + + +" +op_504*" +val + + + +  +��� + transpose +x + +attn_output_27! +perm + +attn_output_29_perm_0/ + transpose_35 +  + +� + +@*" +name + +" + transpose_35~ +reshape +x + + transpose_35 +shape + +var_504& +input_77 +  + +� +�* +name + + " + +input_77� +linear +x + + +input_77D +weight: +8 +6model_model_decoder_layers_2_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_2_self_attn_out_proj_bias' + linear_23 +  + +� +�* +name + + " + linear_23| +add +x + +hidden_states_21 +y + + linear_23& +input_81 +  + +� +�* +name + + " + +input_81� +const' +hidden_states_25_axes_0 + + +*- +name% + +" +hidden_states_25_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_81# +axes + +hidden_states_25_axes_0E +gamma< +: +8model_model_decoder_layers_2_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_2_self_attn_layer_norm_bias +epsilon + + +var_12. +hidden_states_25 +  + +� +�*& +name + +" +hidden_states_25� +linear +x + +hidden_states_25E +weight; +9 +7model_model_decoder_layers_2_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_2_encoder_attn_q_proj_bias' + linear_24 +  + +� +�* +name + + " + linear_24Q +const +var_525 + * +name + + +" +op_525* +val +  + + + +>u +mul +x + + linear_24 +y + +var_525' + tensor_35 +  + +� +�* +name + + " + tensor_35� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_2_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_2_encoder_attn_k_proj_bias' + linear_25 +  + +� +�* +name + + " + linear_25j +const +var_530 + + +* +name + + +" +op_530** +val# + + + + + ���������@} +reshape +x + + linear_25 +shape + +var_530* +var_531 +  + +� + +@* +name + + +" +op_531o +const +var_532_perm_0 + + +*# +name + +" + op_532_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_2_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_2_encoder_attn_v_proj_bias' + linear_26 +  + +� +�* +name + + " + linear_26j +const +var_537 + + +* +name + + +" +op_537** +val# + + + + + ���������@} +reshape +x + + linear_26 +shape + +var_537* +var_538 +  + +� + +@* +name + + +" +op_538o +const +var_539_perm_0 + + +*# +name + +" + op_539_perm_0*! +val + + + + + +b +const +var_546 + + +* +name + + +" +op_546*" +val + + + +  +�@} +reshape +x + + tensor_35 +shape + +var_546* +var_547 +  + +� + +@* +name + + +" +op_547o +const +var_548_perm_0 + + +*# +name + +" + op_548_perm_0*! +val + + + + + +i +const +var_550 + + +* +name + + +" +op_550*) +val" + + + + + ���������@� + transpose +x + +var_547 +perm + +var_548_perm_0/ + transpose_32 +  + + +� +@*" +name + +" + transpose_32� +reshape +x + + transpose_32 +shape + +var_550, +query_states_11 +  + +� +@*% +name + +" +query_states_11i +const +var_552 + + +* +name + + +" +op_552*) +val" + + + + + ���������@� + transpose +x + +var_531 +perm + +var_532_perm_0/ + transpose_34 +  + + +� +@*" +name + +" + transpose_34� +reshape +x + + transpose_34 +shape + +var_552* + key_states_23 +  + +� +@*# +name + +" + key_states_23i +const +var_554 + + +* +name + + +" +op_554*) +val" + + + + + ���������@� + transpose +x + +var_538 +perm + +var_539_perm_0/ + transpose_33 +  + + +� +@*" +name + +" + transpose_33� +reshape +x + + transpose_33 +shape + +var_554, +value_states_23 +  + +� +@*% +name + +" +value_states_23n +const +var_557_perm_0 + + +*# +name + +" + op_557_perm_0* +val + + + + +{ +const% +attn_weights_31_transpose_x_0 +*3 +name+ +# +!" +attn_weights_31_transpose_x_0* +val + + +{ +const% +attn_weights_31_transpose_y_0 +*3 +name+ +# +!" +attn_weights_31_transpose_y_0* +val + + +� + transpose +x + + key_states_23 +perm + +var_557_perm_0) + transpose_31 +  + +@ +�*" +name + +" + transpose_31� +matmul +x + +query_states_11 +y + + transpose_310 + transpose_x! + +attn_weights_31_transpose_x_00 + transpose_y! + +attn_weights_31_transpose_y_0- +attn_weights_31 +  + +� +�*% +name + +" +attn_weights_31c +const +var_559 + + +* +name + + +" +op_559*# +val + + + + + +��� +reshape +x + +attn_weights_31 +shape + +var_559+ +var_560 +  + + +� +�* +name + + +" +op_560� +add +x + +var_560 +y + +attention_mask3 +attn_weights_33 +  + + +� +�*% +name + +" +attn_weights_33b +const +var_565 + + +* +name + + +" +op_565*" +val + + + +  +��� +reshape +x + +attn_weights_33 +shape + +var_565& +input_83 +  + +� +�* +name + + " + +input_83x +softmax +x + + +input_83 +axis + + +var_21& +input_85 +  + +� +�* +name + + " + +input_85y +const$ +attn_output_31_transpose_x_0 +*2 +name* +" + " +attn_output_31_transpose_x_0* +val + + +y +const$ +attn_output_31_transpose_y_0 +*2 +name* +" + " +attn_output_31_transpose_y_0* +val + + +� +matmul +x + + +input_85 +y + +value_states_23/ + transpose_x + +attn_output_31_transpose_x_0/ + transpose_y + +attn_output_31_transpose_y_0+ +attn_output_31 +  + +� +@*$ +name + +" +attn_output_31b +const +var_570 + + +* +name + + +" +op_570*" +val + + + +  +�@� +reshape +x + +attn_output_31 +shape + +var_5701 +attn_output_33 +  + + +� +@*$ +name + +" +attn_output_33~ +const% +attn_output_35_perm_0 + + +*+ +name# + +" +attn_output_35_perm_0*! +val + + + + + +b +const +var_573 + + +* +name + + +" +op_573*" +val + + + +  +��� + transpose +x + +attn_output_33! +perm + +attn_output_35_perm_0/ + transpose_30 +  + +� + +@*" +name + +" + transpose_30~ +reshape +x + + transpose_30 +shape + +var_573& +input_87 +  + +� +�* +name + + " + +input_87� +linear +x + + +input_87G +weight= +; +9model_model_decoder_layers_2_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_2_encoder_attn_out_proj_bias' + linear_27 +  + +� +�* +name + + " + linear_27| +add +x + +hidden_states_25 +y + + linear_27& +input_91 +  + +� +�* +name + + " + +input_91x +const +input_93_axes_0 + + +*% +name + +" +input_93_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + +input_91 +axes + +input_93_axes_0H +gamma? += +;model_model_decoder_layers_2_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_2_encoder_attn_layer_norm_bias +epsilon + + +var_12& +input_93 +  + +� +�* +name + + " + +input_93� +linear +x + + +input_935 +weight+ +) +'model_model_decoder_layers_2_fc1_weight1 +bias) +' +%model_model_decoder_layers_2_fc1_bias' + linear_28 +  + +� +� * +name + + " + linear_28c +const +input_97_mode_0 +*% +name + +" +input_97_mode_0* +val + + " +EXACT +gelu +x + + linear_28 +mode + +input_97_mode_0& +input_97 +  + +� +� * +name + + " + +input_97� +linear +x + + +input_975 +weight+ +) +'model_model_decoder_layers_2_fc2_weight1 +bias) +' +%model_model_decoder_layers_2_fc2_bias' + linear_29 +  + +� +�* +name + + " + linear_29v +add +x + + +input_93 +y + + linear_29' + input_103 +  + +� +�* +name + + " + input_103� +const' +hidden_states_31_axes_0 + + +*- +name% + +" +hidden_states_31_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_103# +axes + +hidden_states_31_axes_0A +gamma8 +6 +4model_model_decoder_layers_2_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_2_final_layer_norm_bias +epsilon + + +var_12. +hidden_states_31 +  + +� +�*& +name + +" +hidden_states_31� +linear +x + +hidden_states_31B +weight8 +6 +4model_model_decoder_layers_3_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_3_self_attn_q_proj_bias' + linear_30 +  + +� +�* +name + + " + linear_30Q +const +var_615 + * +name + + +" +op_615* +val +  + + + +>u +mul +x + + linear_30 +y + +var_615' + tensor_41 +  + +� +�* +name + + " + tensor_41� +linear +x + +hidden_states_31B +weight8 +6 +4model_model_decoder_layers_3_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_3_self_attn_k_proj_bias' + linear_31 +  + +� +�* +name + + " + linear_31j +const +var_620 + + +* +name + + +" +op_620** +val# + + + + + ���������@} +reshape +x + + linear_31 +shape + +var_620* +var_621 +  + +� + +@* +name + + +" +op_621o +const +var_622_perm_0 + + +*# +name + +" + op_622_perm_0*! +val + + + + + +� +linear +x + +hidden_states_31B +weight8 +6 +4model_model_decoder_layers_3_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_3_self_attn_v_proj_bias' + linear_32 +  + +� +�* +name + + " + linear_32j +const +var_627 + + +* +name + + +" +op_627** +val# + + + + + ���������@} +reshape +x + + linear_32 +shape + +var_627* +var_628 +  + +� + +@* +name + + +" +op_628o +const +var_629_perm_0 + + +*# +name + +" + op_629_perm_0*! +val + + + + + +b +const +var_636 + + +* +name + + +" +op_636*" +val + + + +  +�@} +reshape +x + + tensor_41 +shape + +var_636* +var_637 +  + +� + +@* +name + + +" +op_637o +const +var_638_perm_0 + + +*# +name + +" + op_638_perm_0*! +val + + + + + +i +const +var_640 + + +* +name + + +" +op_640*) +val" + + + + + ���������@� + transpose +x + +var_637 +perm + +var_638_perm_0/ + transpose_27 +  + + +� +@*" +name + +" + transpose_27� +reshape +x + + transpose_27 +shape + +var_640, +query_states_13 +  + +� +@*% +name + +" +query_states_13i +const +var_642 + + +* +name + + +" +op_642*) +val" + + + + + ���������@� + transpose +x + +var_621 +perm + +var_622_perm_0/ + transpose_29 +  + + +� +@*" +name + +" + transpose_29� +reshape +x + + transpose_29 +shape + +var_642* + key_states_27 +  + +� +@*# +name + +" + key_states_27i +const +var_644 + + +* +name + + +" +op_644*) +val" + + + + + ���������@� + transpose +x + +var_628 +perm + +var_629_perm_0/ + transpose_28 +  + + +� +@*" +name + +" + transpose_28� +reshape +x + + transpose_28 +shape + +var_644, +value_states_27 +  + +� +@*% +name + +" +value_states_27n +const +var_647_perm_0 + + +*# +name + +" + op_647_perm_0* +val + + + + +{ +const% +attn_weights_37_transpose_x_0 +*3 +name+ +# +!" +attn_weights_37_transpose_x_0* +val + + +{ +const% +attn_weights_37_transpose_y_0 +*3 +name+ +# +!" +attn_weights_37_transpose_y_0* +val + + +� + transpose +x + + key_states_27 +perm + +var_647_perm_0) + transpose_26 +  + +@ +�*" +name + +" + transpose_26� +matmul +x + +query_states_13 +y + + transpose_260 + transpose_x! + +attn_weights_37_transpose_x_00 + transpose_y! + +attn_weights_37_transpose_y_0- +attn_weights_37 +  + +� +�*% +name + +" +attn_weights_37c +const +var_649 + + +* +name + + +" +op_649*# +val + + + + + +��� +reshape +x + +attn_weights_37 +shape + +var_649+ +var_650 +  + + +� +�* +name + + +" +op_650� +add +x + +var_650 +y + +attention_mask_13 +attn_weights_39 +  + + +� +�*% +name + +" +attn_weights_39b +const +var_655 + + +* +name + + +" +op_655*" +val + + + +  +��� +reshape +x + +attn_weights_39 +shape + +var_655' + input_105 +  + +� +�* +name + + " + input_105{ +softmax +x + + input_105 +axis + + +var_21' + input_107 +  + +� +�* +name + + " + input_107y +const$ +attn_output_37_transpose_x_0 +*2 +name* +" + " +attn_output_37_transpose_x_0* +val + + +y +const$ +attn_output_37_transpose_y_0 +*2 +name* +" + " +attn_output_37_transpose_y_0* +val + + +� +matmul +x + + input_107 +y + +value_states_27/ + transpose_x + +attn_output_37_transpose_x_0/ + transpose_y + +attn_output_37_transpose_y_0+ +attn_output_37 +  + +� +@*$ +name + +" +attn_output_37b +const +var_660 + + +* +name + + +" +op_660*" +val + + + +  +�@� +reshape +x + +attn_output_37 +shape + +var_6601 +attn_output_39 +  + + +� +@*$ +name + +" +attn_output_39~ +const% +attn_output_41_perm_0 + + +*+ +name# + +" +attn_output_41_perm_0*! +val + + + + + +b +const +var_663 + + +* +name + + +" +op_663*" +val + + + +  +��� + transpose +x + +attn_output_39! +perm + +attn_output_41_perm_0/ + transpose_25 +  + +� + +@*" +name + +" + transpose_25� +reshape +x + + transpose_25 +shape + +var_663' + input_109 +  + +� +�* +name + + " + input_109� +linear +x + + input_109D +weight: +8 +6model_model_decoder_layers_3_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_3_self_attn_out_proj_bias' + linear_33 +  + +� +�* +name + + " + linear_33~ +add +x + +hidden_states_31 +y + + linear_33' + input_113 +  + +� +�* +name + + " + input_113� +const' +hidden_states_35_axes_0 + + +*- +name% + +" +hidden_states_35_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_113# +axes + +hidden_states_35_axes_0E +gamma< +: +8model_model_decoder_layers_3_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_3_self_attn_layer_norm_bias +epsilon + + +var_12. +hidden_states_35 +  + +� +�*& +name + +" +hidden_states_35� +linear +x + +hidden_states_35E +weight; +9 +7model_model_decoder_layers_3_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_3_encoder_attn_q_proj_bias' + linear_34 +  + +� +�* +name + + " + linear_34Q +const +var_684 + * +name + + +" +op_684* +val +  + + + +>u +mul +x + + linear_34 +y + +var_684' + tensor_47 +  + +� +�* +name + + " + tensor_47� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_3_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_3_encoder_attn_k_proj_bias' + linear_35 +  + +� +�* +name + + " + linear_35j +const +var_689 + + +* +name + + +" +op_689** +val# + + + + + ���������@} +reshape +x + + linear_35 +shape + +var_689* +var_690 +  + +� + +@* +name + + +" +op_690o +const +var_691_perm_0 + + +*# +name + +" + op_691_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_3_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_3_encoder_attn_v_proj_bias' + linear_36 +  + +� +�* +name + + " + linear_36j +const +var_696 + + +* +name + + +" +op_696** +val# + + + + + ���������@} +reshape +x + + linear_36 +shape + +var_696* +var_697 +  + +� + +@* +name + + +" +op_697o +const +var_698_perm_0 + + +*# +name + +" + op_698_perm_0*! +val + + + + + +b +const +var_705 + + +* +name + + +" +op_705*" +val + + + +  +�@} +reshape +x + + tensor_47 +shape + +var_705* +var_706 +  + +� + +@* +name + + +" +op_706o +const +var_707_perm_0 + + +*# +name + +" + op_707_perm_0*! +val + + + + + +i +const +var_709 + + +* +name + + +" +op_709*) +val" + + + + + ���������@� + transpose +x + +var_706 +perm + +var_707_perm_0/ + transpose_22 +  + + +� +@*" +name + +" + transpose_22� +reshape +x + + transpose_22 +shape + +var_709, +query_states_15 +  + +� +@*% +name + +" +query_states_15i +const +var_711 + + +* +name + + +" +op_711*) +val" + + + + + ���������@� + transpose +x + +var_690 +perm + +var_691_perm_0/ + transpose_24 +  + + +� +@*" +name + +" + transpose_24� +reshape +x + + transpose_24 +shape + +var_711* + key_states_31 +  + +� +@*# +name + +" + key_states_31i +const +var_713 + + +* +name + + +" +op_713*) +val" + + + + + ���������@� + transpose +x + +var_697 +perm + +var_698_perm_0/ + transpose_23 +  + + +� +@*" +name + +" + transpose_23� +reshape +x + + transpose_23 +shape + +var_713, +value_states_31 +  + +� +@*% +name + +" +value_states_31n +const +var_716_perm_0 + + +*# +name + +" + op_716_perm_0* +val + + + + +{ +const% +attn_weights_43_transpose_x_0 +*3 +name+ +# +!" +attn_weights_43_transpose_x_0* +val + + +{ +const% +attn_weights_43_transpose_y_0 +*3 +name+ +# +!" +attn_weights_43_transpose_y_0* +val + + +� + transpose +x + + key_states_31 +perm + +var_716_perm_0) + transpose_21 +  + +@ +�*" +name + +" + transpose_21� +matmul +x + +query_states_15 +y + + transpose_210 + transpose_x! + +attn_weights_43_transpose_x_00 + transpose_y! + +attn_weights_43_transpose_y_0- +attn_weights_43 +  + +� +�*% +name + +" +attn_weights_43c +const +var_718 + + +* +name + + +" +op_718*# +val + + + + + +��� +reshape +x + +attn_weights_43 +shape + +var_718+ +var_719 +  + + +� +�* +name + + +" +op_719� +add +x + +var_719 +y + +attention_mask3 +attn_weights_45 +  + + +� +�*% +name + +" +attn_weights_45b +const +var_724 + + +* +name + + +" +op_724*" +val + + + +  +��� +reshape +x + +attn_weights_45 +shape + +var_724' + input_115 +  + +� +�* +name + + " + input_115{ +softmax +x + + input_115 +axis + + +var_21' + input_117 +  + +� +�* +name + + " + input_117y +const$ +attn_output_43_transpose_x_0 +*2 +name* +" + " +attn_output_43_transpose_x_0* +val + + +y +const$ +attn_output_43_transpose_y_0 +*2 +name* +" + " +attn_output_43_transpose_y_0* +val + + +� +matmul +x + + input_117 +y + +value_states_31/ + transpose_x + +attn_output_43_transpose_x_0/ + transpose_y + +attn_output_43_transpose_y_0+ +attn_output_43 +  + +� +@*$ +name + +" +attn_output_43b +const +var_729 + + +* +name + + +" +op_729*" +val + + + +  +�@� +reshape +x + +attn_output_43 +shape + +var_7291 +attn_output_45 +  + + +� +@*$ +name + +" +attn_output_45~ +const% +attn_output_47_perm_0 + + +*+ +name# + +" +attn_output_47_perm_0*! +val + + + + + +b +const +var_732 + + +* +name + + +" +op_732*" +val + + + +  +��� + transpose +x + +attn_output_45! +perm + +attn_output_47_perm_0/ + transpose_20 +  + +� + +@*" +name + +" + transpose_20� +reshape +x + + transpose_20 +shape + +var_732' + input_119 +  + +� +�* +name + + " + input_119� +linear +x + + input_119G +weight= +; +9model_model_decoder_layers_3_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_3_encoder_attn_out_proj_bias' + linear_37 +  + +� +�* +name + + " + linear_37~ +add +x + +hidden_states_35 +y + + linear_37' + input_123 +  + +� +�* +name + + " + input_123z +const +input_125_axes_0 + + +*& +name + +" +input_125_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_123 +axes + +input_125_axes_0H +gamma? += +;model_model_decoder_layers_3_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_3_encoder_attn_layer_norm_bias +epsilon + + +var_12' + input_125 +  + +� +�* +name + + " + input_125� +linear +x + + input_1255 +weight+ +) +'model_model_decoder_layers_3_fc1_weight1 +bias) +' +%model_model_decoder_layers_3_fc1_bias' + linear_38 +  + +� +� * +name + + " + linear_38e +const +input_129_mode_0 +*& +name + +" +input_129_mode_0* +val + + " +EXACT� +gelu +x + + linear_38 +mode + +input_129_mode_0' + input_129 +  + +� +� * +name + + " + input_129� +linear +x + + input_1295 +weight+ +) +'model_model_decoder_layers_3_fc2_weight1 +bias) +' +%model_model_decoder_layers_3_fc2_bias' + linear_39 +  + +� +�* +name + + " + linear_39w +add +x + + input_125 +y + + linear_39' + input_135 +  + +� +�* +name + + " + input_135� +const' +hidden_states_41_axes_0 + + +*- +name% + +" +hidden_states_41_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_135# +axes + +hidden_states_41_axes_0A +gamma8 +6 +4model_model_decoder_layers_3_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_3_final_layer_norm_bias +epsilon + + +var_12. +hidden_states_41 +  + +� +�*& +name + +" +hidden_states_41� +linear +x + +hidden_states_41B +weight8 +6 +4model_model_decoder_layers_4_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_4_self_attn_q_proj_bias' + linear_40 +  + +� +�* +name + + " + linear_40Q +const +var_774 + * +name + + +" +op_774* +val +  + + + +>u +mul +x + + linear_40 +y + +var_774' + tensor_53 +  + +� +�* +name + + " + tensor_53� +linear +x + +hidden_states_41B +weight8 +6 +4model_model_decoder_layers_4_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_4_self_attn_k_proj_bias' + linear_41 +  + +� +�* +name + + " + linear_41j +const +var_779 + + +* +name + + +" +op_779** +val# + + + + + ���������@} +reshape +x + + linear_41 +shape + +var_779* +var_780 +  + +� + +@* +name + + +" +op_780o +const +var_781_perm_0 + + +*# +name + +" + op_781_perm_0*! +val + + + + + +� +linear +x + +hidden_states_41B +weight8 +6 +4model_model_decoder_layers_4_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_4_self_attn_v_proj_bias' + linear_42 +  + +� +�* +name + + " + linear_42j +const +var_786 + + +* +name + + +" +op_786** +val# + + + + + ���������@} +reshape +x + + linear_42 +shape + +var_786* +var_787 +  + +� + +@* +name + + +" +op_787o +const +var_788_perm_0 + + +*# +name + +" + op_788_perm_0*! +val + + + + + +b +const +var_795 + + +* +name + + +" +op_795*" +val + + + +  +�@} +reshape +x + + tensor_53 +shape + +var_795* +var_796 +  + +� + +@* +name + + +" +op_796o +const +var_797_perm_0 + + +*# +name + +" + op_797_perm_0*! +val + + + + + +i +const +var_799 + + +* +name + + +" +op_799*) +val" + + + + + ���������@� + transpose +x + +var_796 +perm + +var_797_perm_0/ + transpose_17 +  + + +� +@*" +name + +" + transpose_17� +reshape +x + + transpose_17 +shape + +var_799, +query_states_17 +  + +� +@*% +name + +" +query_states_17i +const +var_801 + + +* +name + + +" +op_801*) +val" + + + + + ���������@� + transpose +x + +var_780 +perm + +var_781_perm_0/ + transpose_19 +  + + +� +@*" +name + +" + transpose_19� +reshape +x + + transpose_19 +shape + +var_801* + key_states_35 +  + +� +@*# +name + +" + key_states_35i +const +var_803 + + +* +name + + +" +op_803*) +val" + + + + + ���������@� + transpose +x + +var_787 +perm + +var_788_perm_0/ + transpose_18 +  + + +� +@*" +name + +" + transpose_18� +reshape +x + + transpose_18 +shape + +var_803, +value_states_35 +  + +� +@*% +name + +" +value_states_35n +const +var_806_perm_0 + + +*# +name + +" + op_806_perm_0* +val + + + + +{ +const% +attn_weights_49_transpose_x_0 +*3 +name+ +# +!" +attn_weights_49_transpose_x_0* +val + + +{ +const% +attn_weights_49_transpose_y_0 +*3 +name+ +# +!" +attn_weights_49_transpose_y_0* +val + + +� + transpose +x + + key_states_35 +perm + +var_806_perm_0) + transpose_16 +  + +@ +�*" +name + +" + transpose_16� +matmul +x + +query_states_17 +y + + transpose_160 + transpose_x! + +attn_weights_49_transpose_x_00 + transpose_y! + +attn_weights_49_transpose_y_0- +attn_weights_49 +  + +� +�*% +name + +" +attn_weights_49c +const +var_808 + + +* +name + + +" +op_808*# +val + + + + + +��� +reshape +x + +attn_weights_49 +shape + +var_808+ +var_809 +  + + +� +�* +name + + +" +op_809� +add +x + +var_809 +y + +attention_mask_13 +attn_weights_51 +  + + +� +�*% +name + +" +attn_weights_51b +const +var_814 + + +* +name + + +" +op_814*" +val + + + +  +��� +reshape +x + +attn_weights_51 +shape + +var_814' + input_137 +  + +� +�* +name + + " + input_137{ +softmax +x + + input_137 +axis + + +var_21' + input_139 +  + +� +�* +name + + " + input_139y +const$ +attn_output_49_transpose_x_0 +*2 +name* +" + " +attn_output_49_transpose_x_0* +val + + +y +const$ +attn_output_49_transpose_y_0 +*2 +name* +" + " +attn_output_49_transpose_y_0* +val + + +� +matmul +x + + input_139 +y + +value_states_35/ + transpose_x + +attn_output_49_transpose_x_0/ + transpose_y + +attn_output_49_transpose_y_0+ +attn_output_49 +  + +� +@*$ +name + +" +attn_output_49b +const +var_819 + + +* +name + + +" +op_819*" +val + + + +  +�@� +reshape +x + +attn_output_49 +shape + +var_8191 +attn_output_51 +  + + +� +@*$ +name + +" +attn_output_51~ +const% +attn_output_53_perm_0 + + +*+ +name# + +" +attn_output_53_perm_0*! +val + + + + + +b +const +var_822 + + +* +name + + +" +op_822*" +val + + + +  +��� + transpose +x + +attn_output_51! +perm + +attn_output_53_perm_0/ + transpose_15 +  + +� + +@*" +name + +" + transpose_15� +reshape +x + + transpose_15 +shape + +var_822' + input_141 +  + +� +�* +name + + " + input_141� +linear +x + + input_141D +weight: +8 +6model_model_decoder_layers_4_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_4_self_attn_out_proj_bias' + linear_43 +  + +� +�* +name + + " + linear_43~ +add +x + +hidden_states_41 +y + + linear_43' + input_145 +  + +� +�* +name + + " + input_145� +const' +hidden_states_45_axes_0 + + +*- +name% + +" +hidden_states_45_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_145# +axes + +hidden_states_45_axes_0E +gamma< +: +8model_model_decoder_layers_4_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_4_self_attn_layer_norm_bias +epsilon + + +var_12. +hidden_states_45 +  + +� +�*& +name + +" +hidden_states_45� +linear +x + +hidden_states_45E +weight; +9 +7model_model_decoder_layers_4_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_4_encoder_attn_q_proj_bias' + linear_44 +  + +� +�* +name + + " + linear_44Q +const +var_843 + * +name + + +" +op_843* +val +  + + + +>u +mul +x + + linear_44 +y + +var_843' + tensor_59 +  + +� +�* +name + + " + tensor_59� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_4_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_4_encoder_attn_k_proj_bias' + linear_45 +  + +� +�* +name + + " + linear_45j +const +var_848 + + +* +name + + +" +op_848** +val# + + + + + ���������@} +reshape +x + + linear_45 +shape + +var_848* +var_849 +  + +� + +@* +name + + +" +op_849o +const +var_850_perm_0 + + +*# +name + +" + op_850_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_4_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_4_encoder_attn_v_proj_bias' + linear_46 +  + +� +�* +name + + " + linear_46j +const +var_855 + + +* +name + + +" +op_855** +val# + + + + + ���������@} +reshape +x + + linear_46 +shape + +var_855* +var_856 +  + +� + +@* +name + + +" +op_856o +const +var_857_perm_0 + + +*# +name + +" + op_857_perm_0*! +val + + + + + +b +const +var_864 + + +* +name + + +" +op_864*" +val + + + +  +�@} +reshape +x + + tensor_59 +shape + +var_864* +var_865 +  + +� + +@* +name + + +" +op_865o +const +var_866_perm_0 + + +*# +name + +" + op_866_perm_0*! +val + + + + + +i +const +var_868 + + +* +name + + +" +op_868*) +val" + + + + + ���������@� + transpose +x + +var_865 +perm + +var_866_perm_0/ + transpose_12 +  + + +� +@*" +name + +" + transpose_12� +reshape +x + + transpose_12 +shape + +var_868, +query_states_19 +  + +� +@*% +name + +" +query_states_19i +const +var_870 + + +* +name + + +" +op_870*) +val" + + + + + ���������@� + transpose +x + +var_849 +perm + +var_850_perm_0/ + transpose_14 +  + + +� +@*" +name + +" + transpose_14� +reshape +x + + transpose_14 +shape + +var_870* + key_states_39 +  + +� +@*# +name + +" + key_states_39i +const +var_872 + + +* +name + + +" +op_872*) +val" + + + + + ���������@� + transpose +x + +var_856 +perm + +var_857_perm_0/ + transpose_13 +  + + +� +@*" +name + +" + transpose_13� +reshape +x + + transpose_13 +shape + +var_872, +value_states_39 +  + +� +@*% +name + +" +value_states_39n +const +var_875_perm_0 + + +*# +name + +" + op_875_perm_0* +val + + + + +{ +const% +attn_weights_55_transpose_x_0 +*3 +name+ +# +!" +attn_weights_55_transpose_x_0* +val + + +{ +const% +attn_weights_55_transpose_y_0 +*3 +name+ +# +!" +attn_weights_55_transpose_y_0* +val + + +� + transpose +x + + key_states_39 +perm + +var_875_perm_0) + transpose_11 +  + +@ +�*" +name + +" + transpose_11� +matmul +x + +query_states_19 +y + + transpose_110 + transpose_x! + +attn_weights_55_transpose_x_00 + transpose_y! + +attn_weights_55_transpose_y_0- +attn_weights_55 +  + +� +�*% +name + +" +attn_weights_55c +const +var_877 + + +* +name + + +" +op_877*# +val + + + + + +��� +reshape +x + +attn_weights_55 +shape + +var_877+ +var_878 +  + + +� +�* +name + + +" +op_878� +add +x + +var_878 +y + +attention_mask3 +attn_weights_57 +  + + +� +�*% +name + +" +attn_weights_57b +const +var_883 + + +* +name + + +" +op_883*" +val + + + +  +��� +reshape +x + +attn_weights_57 +shape + +var_883' + input_147 +  + +� +�* +name + + " + input_147{ +softmax +x + + input_147 +axis + + +var_21' + input_149 +  + +� +�* +name + + " + input_149y +const$ +attn_output_55_transpose_x_0 +*2 +name* +" + " +attn_output_55_transpose_x_0* +val + + +y +const$ +attn_output_55_transpose_y_0 +*2 +name* +" + " +attn_output_55_transpose_y_0* +val + + +� +matmul +x + + input_149 +y + +value_states_39/ + transpose_x + +attn_output_55_transpose_x_0/ + transpose_y + +attn_output_55_transpose_y_0+ +attn_output_55 +  + +� +@*$ +name + +" +attn_output_55b +const +var_888 + + +* +name + + +" +op_888*" +val + + + +  +�@� +reshape +x + +attn_output_55 +shape + +var_8881 +attn_output_57 +  + + +� +@*$ +name + +" +attn_output_57~ +const% +attn_output_59_perm_0 + + +*+ +name# + +" +attn_output_59_perm_0*! +val + + + + + +b +const +var_891 + + +* +name + + +" +op_891*" +val + + + +  +��� + transpose +x + +attn_output_57! +perm + +attn_output_59_perm_0/ + transpose_10 +  + +� + +@*" +name + +" + transpose_10� +reshape +x + + transpose_10 +shape + +var_891' + input_151 +  + +� +�* +name + + " + input_151� +linear +x + + input_151G +weight= +; +9model_model_decoder_layers_4_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_4_encoder_attn_out_proj_bias' + linear_47 +  + +� +�* +name + + " + linear_47~ +add +x + +hidden_states_45 +y + + linear_47' + input_155 +  + +� +�* +name + + " + input_155z +const +input_157_axes_0 + + +*& +name + +" +input_157_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_155 +axes + +input_157_axes_0H +gamma? += +;model_model_decoder_layers_4_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_4_encoder_attn_layer_norm_bias +epsilon + + +var_12' + input_157 +  + +� +�* +name + + " + input_157� +linear +x + + input_1575 +weight+ +) +'model_model_decoder_layers_4_fc1_weight1 +bias) +' +%model_model_decoder_layers_4_fc1_bias' + linear_48 +  + +� +� * +name + + " + linear_48e +const +input_161_mode_0 +*& +name + +" +input_161_mode_0* +val + + " +EXACT� +gelu +x + + linear_48 +mode + +input_161_mode_0' + input_161 +  + +� +� * +name + + " + input_161� +linear +x + + input_1615 +weight+ +) +'model_model_decoder_layers_4_fc2_weight1 +bias) +' +%model_model_decoder_layers_4_fc2_bias' + linear_49 +  + +� +�* +name + + " + linear_49w +add +x + + input_157 +y + + linear_49' + input_167 +  + +� +�* +name + + " + input_167� +const' +hidden_states_51_axes_0 + + +*- +name% + +" +hidden_states_51_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_167# +axes + +hidden_states_51_axes_0A +gamma8 +6 +4model_model_decoder_layers_4_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_4_final_layer_norm_bias +epsilon + + +var_12. +hidden_states_51 +  + +� +�*& +name + +" +hidden_states_51� +linear +x + +hidden_states_51B +weight8 +6 +4model_model_decoder_layers_5_self_attn_q_proj_weight> +bias6 +4 +2model_model_decoder_layers_5_self_attn_q_proj_bias' + linear_50 +  + +� +�* +name + + " + linear_50Q +const +var_933 + * +name + + +" +op_933* +val +  + + + +>u +mul +x + + linear_50 +y + +var_933' + tensor_65 +  + +� +�* +name + + " + tensor_65� +linear +x + +hidden_states_51B +weight8 +6 +4model_model_decoder_layers_5_self_attn_k_proj_weight> +bias6 +4 +2model_model_decoder_layers_5_self_attn_k_proj_bias' + linear_51 +  + +� +�* +name + + " + linear_51j +const +var_938 + + +* +name + + +" +op_938** +val# + + + + + ���������@} +reshape +x + + linear_51 +shape + +var_938* +var_939 +  + +� + +@* +name + + +" +op_939o +const +var_940_perm_0 + + +*# +name + +" + op_940_perm_0*! +val + + + + + +� +linear +x + +hidden_states_51B +weight8 +6 +4model_model_decoder_layers_5_self_attn_v_proj_weight> +bias6 +4 +2model_model_decoder_layers_5_self_attn_v_proj_bias' + linear_52 +  + +� +�* +name + + " + linear_52j +const +var_945 + + +* +name + + +" +op_945** +val# + + + + + ���������@} +reshape +x + + linear_52 +shape + +var_945* +var_946 +  + +� + +@* +name + + +" +op_946o +const +var_947_perm_0 + + +*# +name + +" + op_947_perm_0*! +val + + + + + +b +const +var_954 + + +* +name + + +" +op_954*" +val + + + +  +�@} +reshape +x + + tensor_65 +shape + +var_954* +var_955 +  + +� + +@* +name + + +" +op_955o +const +var_956_perm_0 + + +*# +name + +" + op_956_perm_0*! +val + + + + + +i +const +var_958 + + +* +name + + +" +op_958*) +val" + + + + + ���������@� + transpose +x + +var_955 +perm + +var_956_perm_0. + transpose_7 +  + + +� +@*! +name + +" + transpose_7� +reshape +x + + transpose_7 +shape + +var_958, +query_states_21 +  + +� +@*% +name + +" +query_states_21i +const +var_960 + + +* +name + + +" +op_960*) +val" + + + + + ���������@� + transpose +x + +var_939 +perm + +var_940_perm_0. + transpose_9 +  + + +� +@*! +name + +" + transpose_9� +reshape +x + + transpose_9 +shape + +var_960* + key_states_43 +  + +� +@*# +name + +" + key_states_43i +const +var_962 + + +* +name + + +" +op_962*) +val" + + + + + ���������@� + transpose +x + +var_946 +perm + +var_947_perm_0. + transpose_8 +  + + +� +@*! +name + +" + transpose_8� +reshape +x + + transpose_8 +shape + +var_962, +value_states_43 +  + +� +@*% +name + +" +value_states_43n +const +var_965_perm_0 + + +*# +name + +" + op_965_perm_0* +val + + + + +{ +const% +attn_weights_61_transpose_x_0 +*3 +name+ +# +!" +attn_weights_61_transpose_x_0* +val + + +{ +const% +attn_weights_61_transpose_y_0 +*3 +name+ +# +!" +attn_weights_61_transpose_y_0* +val + + +� + transpose +x + + key_states_43 +perm + +var_965_perm_0( + transpose_6 +  + +@ +�*! +name + +" + transpose_6� +matmul +x + +query_states_21 +y + + transpose_60 + transpose_x! + +attn_weights_61_transpose_x_00 + transpose_y! + +attn_weights_61_transpose_y_0- +attn_weights_61 +  + +� +�*% +name + +" +attn_weights_61c +const +var_967 + + +* +name + + +" +op_967*# +val + + + + + +��� +reshape +x + +attn_weights_61 +shape + +var_967+ +var_968 +  + + +� +�* +name + + +" +op_968� +add +x + +var_968 +y + +attention_mask_13 +attn_weights_63 +  + + +� +�*% +name + +" +attn_weights_63b +const +var_973 + + +* +name + + +" +op_973*" +val + + + +  +��� +reshape +x + +attn_weights_63 +shape + +var_973' + input_169 +  + +� +�* +name + + " + input_169{ +softmax +x + + input_169 +axis + + +var_21' + input_171 +  + +� +�* +name + + " + input_171y +const$ +attn_output_61_transpose_x_0 +*2 +name* +" + " +attn_output_61_transpose_x_0* +val + + +y +const$ +attn_output_61_transpose_y_0 +*2 +name* +" + " +attn_output_61_transpose_y_0* +val + + +� +matmul +x + + input_171 +y + +value_states_43/ + transpose_x + +attn_output_61_transpose_x_0/ + transpose_y + +attn_output_61_transpose_y_0+ +attn_output_61 +  + +� +@*$ +name + +" +attn_output_61b +const +var_978 + + +* +name + + +" +op_978*" +val + + + +  +�@� +reshape +x + +attn_output_61 +shape + +var_9781 +attn_output_63 +  + + +� +@*$ +name + +" +attn_output_63~ +const% +attn_output_65_perm_0 + + +*+ +name# + +" +attn_output_65_perm_0*! +val + + + + + +b +const +var_981 + + +* +name + + +" +op_981*" +val + + + +  +��� + transpose +x + +attn_output_63! +perm + +attn_output_65_perm_0. + transpose_5 +  + +� + +@*! +name + +" + transpose_5 +reshape +x + + transpose_5 +shape + +var_981' + input_173 +  + +� +�* +name + + " + input_173� +linear +x + + input_173D +weight: +8 +6model_model_decoder_layers_5_self_attn_out_proj_weight@ +bias8 +6 +4model_model_decoder_layers_5_self_attn_out_proj_bias' + linear_53 +  + +� +�* +name + + " + linear_53~ +add +x + +hidden_states_51 +y + + linear_53' + input_177 +  + +� +�* +name + + " + input_177� +const' +hidden_states_55_axes_0 + + +*- +name% + +" +hidden_states_55_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_177# +axes + +hidden_states_55_axes_0E +gamma< +: +8model_model_decoder_layers_5_self_attn_layer_norm_weightB +beta: +8 +6model_model_decoder_layers_5_self_attn_layer_norm_bias +epsilon + + +var_12. +hidden_states_55 +  + +� +�*& +name + +" +hidden_states_55� +linear +x + +hidden_states_55E +weight; +9 +7model_model_decoder_layers_5_encoder_attn_q_proj_weightA +bias9 +7 +5model_model_decoder_layers_5_encoder_attn_q_proj_bias' + linear_54 +  + +� +�* +name + + " + linear_54S +const +var_1002 + * +name + + " +op_1002* +val +  + + + +>� +mul +x + + linear_54 +y + + +var_1002/ +tensor_workaround +  + +� +�*' +name + +" +tensor_workaround� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_5_encoder_attn_k_proj_weightA +bias9 +7 +5model_model_decoder_layers_5_encoder_attn_k_proj_bias' + linear_55 +  + +� +�* +name + + " + linear_55l +const +var_1007 + + +* +name + + " +op_1007** +val# + + + + + ���������@� +reshape +x + + linear_55 +shape + + +var_1007+ +var_1008 +  + +� + +@* +name + + " +op_1008q +const +var_1009_perm_0 + + +*$ +name + +" +op_1009_perm_0*! +val + + + + + +� +linear" +x + +encoder_last_hidden_stateE +weight; +9 +7model_model_decoder_layers_5_encoder_attn_v_proj_weightA +bias9 +7 +5model_model_decoder_layers_5_encoder_attn_v_proj_bias' + linear_56 +  + +� +�* +name + + " + linear_56l +const +var_1014 + + +* +name + + " +op_1014** +val# + + + + + ���������@� +reshape +x + + linear_56 +shape + + +var_1014+ +var_1015 +  + +� + +@* +name + + " +op_1015q +const +var_1016_perm_0 + + +*$ +name + +" +op_1016_perm_0*! +val + + + + + +d +const +var_1023 + + +* +name + + " +op_1023*" +val + + + +  +�@� +reshape +x + +tensor_workaround +shape + + +var_1023+ +var_1024 +  + +� + +@* +name + + " +op_1024q +const +var_1025_perm_0 + + +*$ +name + +" +op_1025_perm_0*! +val + + + + + +k +const +var_1027 + + +* +name + + " +op_1027*) +val" + + + + + ���������@� + transpose +x + + +var_1024 +perm + +var_1025_perm_0. + transpose_2 +  + + +� +@*! +name + +" + transpose_2� +reshape +x + + transpose_2 +shape + + +var_1027) + query_states +  + +� +@*" +name + +" + query_statesk +const +var_1029 + + +* +name + + " +op_1029*) +val" + + + + + ���������@� + transpose +x + + +var_1008 +perm + +var_1009_perm_0. + transpose_4 +  + + +� +@*! +name + +" + transpose_4� +reshape +x + + transpose_4 +shape + + +var_1029' + +key_states +  + +� +@* +name + +" + +key_statesk +const +var_1031 + + +* +name + + " +op_1031*) +val" + + + + + ���������@� + transpose +x + + +var_1015 +perm + +var_1016_perm_0. + transpose_3 +  + + +� +@*! +name + +" + transpose_3� +reshape +x + + transpose_3 +shape + + +var_1031) + value_states +  + +� +@*" +name + +" + value_statesp +const +var_1034_perm_0 + + +*$ +name + +" +op_1034_perm_0* +val + + + + +{ +const% +attn_weights_67_transpose_x_0 +*3 +name+ +# +!" +attn_weights_67_transpose_x_0* +val + + +{ +const% +attn_weights_67_transpose_y_0 +*3 +name+ +# +!" +attn_weights_67_transpose_y_0* +val + + +� + transpose +x + + +key_states +perm + +var_1034_perm_0( + transpose_1 +  + +@ +�*! +name + +" + transpose_1� +matmul +x + + query_states +y + + transpose_10 + transpose_x! + +attn_weights_67_transpose_x_00 + transpose_y! + +attn_weights_67_transpose_y_0- +attn_weights_67 +  + +� +�*% +name + +" +attn_weights_67e +const +var_1036 + + +* +name + + " +op_1036*# +val + + + + + +��� +reshape +x + +attn_weights_67 +shape + + +var_1036, +var_1037 +  + + +� +�* +name + + " +op_1037� +add +x + + +var_1037 +y + +attention_mask3 +attn_weights_69 +  + + +� +�*% +name + +" +attn_weights_69d +const +var_1042 + + +* +name + + " +op_1042*" +val + + + +  +��� +reshape +x + +attn_weights_69 +shape + + +var_1042' + input_179 +  + +� +�* +name + + " + input_179{ +softmax +x + + input_179 +axis + + +var_21' + input_181 +  + +� +�* +name + + " + input_181y +const$ +attn_output_67_transpose_x_0 +*2 +name* +" + " +attn_output_67_transpose_x_0* +val + + +y +const$ +attn_output_67_transpose_y_0 +*2 +name* +" + " +attn_output_67_transpose_y_0* +val + + +� +matmul +x + + input_181 +y + + value_states/ + transpose_x + +attn_output_67_transpose_x_0/ + transpose_y + +attn_output_67_transpose_y_0+ +attn_output_67 +  + +� +@*$ +name + +" +attn_output_67d +const +var_1047 + + +* +name + + " +op_1047*" +val + + + +  +�@� +reshape +x + +attn_output_67 +shape + + +var_10471 +attn_output_69 +  + + +� +@*$ +name + +" +attn_output_69x +const" +attn_output_perm_0 + + +*( +name  + +" +attn_output_perm_0*! +val + + + + + +d +const +var_1050 + + +* +name + + " +op_1050*" +val + + + +  +��� + transpose +x + +attn_output_69 +perm + +attn_output_perm_0. + transpose_0 +  + +� + +@*! +name + +" + transpose_0� +reshape +x + + transpose_0 +shape + + +var_1050' + input_183 +  + +� +�* +name + + " + input_183� +linear +x + + input_183G +weight= +; +9model_model_decoder_layers_5_encoder_attn_out_proj_weightC +bias; +9 +7model_model_decoder_layers_5_encoder_attn_out_proj_bias' + linear_57 +  + +� +�* +name + + " + linear_57~ +add +x + +hidden_states_55 +y + + linear_57' + input_187 +  + +� +�* +name + + " + input_187z +const +input_189_axes_0 + + +*& +name + +" +input_189_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_187 +axes + +input_189_axes_0H +gamma? += +;model_model_decoder_layers_5_encoder_attn_layer_norm_weightE +beta= +; +9model_model_decoder_layers_5_encoder_attn_layer_norm_bias +epsilon + + +var_12' + input_189 +  + +� +�* +name + + " + input_189� +linear +x + + input_1895 +weight+ +) +'model_model_decoder_layers_5_fc1_weight1 +bias) +' +%model_model_decoder_layers_5_fc1_bias' + linear_58 +  + +� +� * +name + + " + linear_58e +const +input_193_mode_0 +*& +name + +" +input_193_mode_0* +val + + " +EXACT� +gelu +x + + linear_58 +mode + +input_193_mode_0' + input_193 +  + +� +� * +name + + " + input_193� +linear +x + + input_1935 +weight+ +) +'model_model_decoder_layers_5_fc2_weight1 +bias) +' +%model_model_decoder_layers_5_fc2_bias' + linear_59 +  + +� +�* +name + + " + linear_59w +add +x + + input_189 +y + + linear_59' + input_199 +  + +� +�* +name + + " + input_199r +const + input_axes_0 + + +*" +name + +" + input_axes_0*' +val  + + + + + +���������� + +layer_norm +x + + input_199 +axes + + input_axes_0A +gamma8 +6 +4model_model_decoder_layers_5_final_layer_norm_weight> +beta6 +4 +2model_model_decoder_layers_5_final_layer_norm_bias +epsilon + + +var_12# +input +  + +� +�* +name + + " +input� +const! +var_1078_bias_0 +   +؈*% +name + +" +var_1078_bias_0*? +val8 +   +؈*& +@model_path/weights/weight.bin��ע� +linear +x + +input' +weight + +model_model_shared_weight +bias + +var_1078_bias_0% +logits +  + +� +؈* +name + + " + +var_1078"� + buildInfo�" + + +|"z +6 +! + +" +coremltools-version + +" +7.0 +@ +) +! +" +coremltools-component-torch + + " +2.0.1 \ No newline at end of file