3root"_tf_keras_model*3{"name": "tfm_t5for_conditional_generation", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "must_restore_from_config": false, "class_name": "TFMT5ForConditionalGeneration", "config": {"return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "pruned_heads": {}, "tie_word_embeddings": false, "is_encoder_decoder": true, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "architectures": ["T5ForConditionalGeneration"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": "T5Tokenizer", "prefix": null, "bos_token_id": null, "pad_token_id": 0, "eos_token_id": 1, "sep_token_id": null, "decoder_start_token_id": 0, "task_specific_params": {"summarization": {"early_stopping": true, "length_penalty": 2.0, "max_length": 200, "min_length": 30, "no_repeat_ngram_size": 3, "num_beams": 4, "prefix": "summarize: "}, "translation_en_to_de": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to German: "}, "translation_en_to_fr": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to French: "}, "translation_en_to_ro": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to Romanian: "}}, "problem_type": null, "_name_or_path": "google/flan-t5-base", "transformers_version": "4.20.1", "model_type": "mt5", "n_positions": 512, "output_past": true, "vocab_size": 32128, "d_model": 768, "d_kv": 64, "d_ff": 2048, "num_layers": 12, "num_decoder_layers": 12, "num_heads": 12, "relative_attention_num_buckets": 32, "relative_attention_max_distance": 128, "dropout_rate": 0.1, "layer_norm_epsilon": 1e-06, "initializer_factor": 1.0, "feed_forward_proj": "gated-gelu", "use_cache": true, "dense_act_fn": "gelu_new", "is_gated_act": true}, "shared_object_id": 0, "is_graph_network": false, "full_save_spec": {"class_name": "__tuple__", "items": [[{"input_ids": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "input_ids"]}, "decoder_input_ids": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "decoder_input_ids"]}, "decoder_attention_mask": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "decoder_attention_mask"]}}], {}]}, "save_spec": {"input_ids": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "input_ids"]}, "decoder_input_ids": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "decoder_input_ids"]}, "decoder_attention_mask": {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [3, 5]}, "int32", "decoder_attention_mask"]}}, "keras_version": "2.6.0", "backend": "tensorflow", "model_config": {"class_name": "TFMT5ForConditionalGeneration", "config": {"return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "pruned_heads": {}, "tie_word_embeddings": false, "is_encoder_decoder": true, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "architectures": ["T5ForConditionalGeneration"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": "T5Tokenizer", "prefix": null, "bos_token_id": null, "pad_token_id": 0, "eos_token_id": 1, "sep_token_id": null, "decoder_start_token_id": 0, "task_specific_params": {"summarization": {"early_stopping": true, "length_penalty": 2.0, "max_length": 200, "min_length": 30, "no_repeat_ngram_size": 3, "num_beams": 4, "prefix": "summarize: "}, "translation_en_to_de": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to German: "}, "translation_en_to_fr": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to French: "}, "translation_en_to_ro": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to Romanian: "}}, "problem_type": null, "_name_or_path": "google/flan-t5-base", "transformers_version": "4.20.1", "model_type": "mt5", "n_positions": 512, "output_past": true, "vocab_size": 32128, "d_model": 768, "d_kv": 64, "d_ff": 2048, "num_layers": 12, "num_decoder_layers": 12, "num_heads": 12, "relative_attention_num_buckets": 32, "relative_attention_max_distance": 128, "dropout_rate": 0.1, "layer_norm_epsilon": 1e-06, "initializer_factor": 1.0, "feed_forward_proj": "gated-gelu", "use_cache": true, "dense_act_fn": "gelu_new", "is_gated_act": true}}, "training_config": {"loss": "dummy_loss", "metrics": null, "weighted_metrics": null, "loss_weights": null, "optimizer_config": {"class_name": "Adam", "config": {"name": "Adam", "learning_rate": 2.9999999242136255e-05, "decay": 0.0, "beta_1": 0.8999999761581421, "beta_2": 0.9990000128746033, "epsilon": 1e-07, "amsgrad": false}}}}2  root.shared"_tf_keras_layer*{"name": "shared", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFSharedEmbeddings", "config": {"name": "shared", "trainable": true, "dtype": "float32", "vocab_size": 32128, "hidden_size": 768, "initializer_range": 1.0}, "shared_object_id": 1, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5]}}2  root.encoder"_tf_keras_layer*{"name": "encoder", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Custom>TFT5MainLayer", "config": {"name": "encoder", "trainable": true, "dtype": "float32", "config": {"return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "pruned_heads": {}, "tie_word_embeddings": false, "is_encoder_decoder": true, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "architectures": ["T5ForConditionalGeneration"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": "T5Tokenizer", "prefix": null, "bos_token_id": null, "pad_token_id": 0, "eos_token_id": 1, "sep_token_id": null, "decoder_start_token_id": 0, "task_specific_params": {"summarization": {"early_stopping": true, "length_penalty": 2.0, "max_length": 200, "min_length": 30, "no_repeat_ngram_size": 3, "num_beams": 4, "prefix": "summarize: "}, "translation_en_to_de": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to German: "}, "translation_en_to_fr": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to French: "}, "translation_en_to_ro": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to Romanian: "}}, "problem_type": null, "_name_or_path": "google/flan-t5-base", "transformers_version": "4.20.1", "model_type": "mt5", "n_positions": 512, "output_past": true, "vocab_size": 32128, "d_model": 768, "d_kv": 64, "d_ff": 2048, "num_layers": 12, "num_decoder_layers": 12, "num_heads": 12, "relative_attention_num_buckets": 32, "relative_attention_max_distance": 128, "dropout_rate": 0.1, "layer_norm_epsilon": 1e-06, "initializer_factor": 1.0, "feed_forward_proj": "gated-gelu", "use_cache": false, "dense_act_fn": "gelu_new", "is_gated_act": true}}, "shared_object_id": 2}2  root.decoder"_tf_keras_layer*{"name": "decoder", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Custom>TFT5MainLayer", "config": {"name": "decoder", "trainable": true, "dtype": "float32", "config": {"return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "pruned_heads": {}, "tie_word_embeddings": false, "is_encoder_decoder": true, "is_decoder": true, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "architectures": ["T5ForConditionalGeneration"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": "T5Tokenizer", "prefix": null, "bos_token_id": null, "pad_token_id": 0, "eos_token_id": 1, "sep_token_id": null, "decoder_start_token_id": 0, "task_specific_params": {"summarization": {"early_stopping": true, "length_penalty": 2.0, "max_length": 200, "min_length": 30, "no_repeat_ngram_size": 3, "num_beams": 4, "prefix": "summarize: "}, "translation_en_to_de": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to German: "}, "translation_en_to_fr": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to French: "}, "translation_en_to_ro": {"early_stopping": true, "max_length": 300, "num_beams": 4, "prefix": "translate English to Romanian: "}}, "problem_type": null, "_name_or_path": "google/flan-t5-base", "transformers_version": "4.20.1", "model_type": "mt5", "n_positions": 512, "output_past": true, "vocab_size": 32128, "d_model": 768, "d_kv": 64, "d_ff": 2048, "num_layers": 12, "num_decoder_layers": 12, "num_heads": 12, "relative_attention_num_buckets": 32, "relative_attention_max_distance": 128, "dropout_rate": 0.1, "layer_norm_epsilon": 1e-06, "initializer_factor": 1.0, "feed_forward_proj": "gated-gelu", "use_cache": true, "dense_act_fn": "gelu_new", "is_gated_act": true}}, "shared_object_id": 3}2  root.lm_head"_tf_keras_layer*{"name": "lm_head", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "lm_head", "trainable": true, "dtype": "float32", "units": 32128, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 1.0, "seed": null}, "shared_object_id": 4}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 5}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 6, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 7}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 root.encoder.final_layer_norm"_tf_keras_layer*{"name": "final_layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 root.encoder.dropout"_tf_keras_layer*{"name": "dropout_48", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_48", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 8}2 root.decoder.final_layer_norm"_tf_keras_layer*{"name": "final_layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 root.decoder.dropout"_tf_keras_layer*{"name": "dropout_121", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_121", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 9}2 root.encoder.block.0"_tf_keras_layer*{"name": "block_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.1"_tf_keras_layer*{"name": "block_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.2"_tf_keras_layer*{"name": "block_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.3"_tf_keras_layer*{"name": "block_._3", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.4"_tf_keras_layer*{"name": "block_._4", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.5"_tf_keras_layer*{"name": "block_._5", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.6"_tf_keras_layer*{"name": "block_._6", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.7"_tf_keras_layer*{"name": "block_._7", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.8"_tf_keras_layer*{"name": "block_._8", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.9"_tf_keras_layer*{"name": "block_._9", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.10"_tf_keras_layer*{"name": "block_._10", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.encoder.block.11"_tf_keras_layer*{"name": "block_._11", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.0"_tf_keras_layer*{"name": "block_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.1"_tf_keras_layer*{"name": "block_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.2"_tf_keras_layer*{"name": "block_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.3"_tf_keras_layer*{"name": "block_._3", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.4"_tf_keras_layer*{"name": "block_._4", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.5"_tf_keras_layer*{"name": "block_._5", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.6"_tf_keras_layer*{"name": "block_._6", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.7"_tf_keras_layer*{"name": "block_._7", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.8"_tf_keras_layer*{"name": "block_._8", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.9"_tf_keras_layer*{"name": "block_._9", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.10"_tf_keras_layer*{"name": "block_._10", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.decoder.block.11"_tf_keras_layer*{"name": "block_._11", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Block", "config": {"layer was saved without config": true}}2 root.keras_api.metrics.0"_tf_keras_metric*{"class_name": "Mean", "name": "loss", "dtype": "float32", "config": {"name": "loss", "dtype": "float32"}, "shared_object_id": 10}2 root.encoder.block.0.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.0.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.1.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.1.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.2.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.2.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.3.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.3.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.4.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.4.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.5.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.5.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.6.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.6.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.7.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.7.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.8.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.8.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.9.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.9.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.10.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.10.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.encoder.block.11.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.encoder.block.11.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.0.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.0.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.0.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.1.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.1.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.1.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.2.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.2.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.2.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.3.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.3.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.3.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.4.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.4.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.4.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.5.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.5.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.5.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.6.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.6.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.6.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.7.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.7.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.7.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.8.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.8.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.8.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.9.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.9.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.9.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.10.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.10.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.10.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 root.decoder.block.11.layer.0"_tf_keras_layer*{"name": "layer_._0", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerSelfAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.11.layer.1"_tf_keras_layer*{"name": "layer_._1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerCrossAttention", "config": {"layer was saved without config": true}}2 root.decoder.block.11.layer.2"_tf_keras_layer*{"name": "layer_._2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerFF", "config": {"layer was saved without config": true}}2 *root.encoder.block.0.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.0.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.0.layer.0.dropout"_tf_keras_layer*{"name": "dropout_1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_1", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 11}2 +root.encoder.block.0.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.0.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.0.layer.1.dropout"_tf_keras_layer*{"name": "dropout_3", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_3", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 12}2 *root.encoder.block.1.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.1.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.1.layer.0.dropout"_tf_keras_layer*{"name": "dropout_5", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_5", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 13}2 +root.encoder.block.1.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.1.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.1.layer.1.dropout"_tf_keras_layer*{"name": "dropout_7", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_7", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 14}2 *root.encoder.block.2.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.2.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.2.layer.0.dropout"_tf_keras_layer*{"name": "dropout_9", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_9", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 15}2 +root.encoder.block.2.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.2.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.2.layer.1.dropout"_tf_keras_layer*{"name": "dropout_11", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_11", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 16}2 *root.encoder.block.3.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.3.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.3.layer.0.dropout"_tf_keras_layer*{"name": "dropout_13", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_13", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 17}2 +root.encoder.block.3.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.3.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.3.layer.1.dropout"_tf_keras_layer*{"name": "dropout_15", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_15", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 18}2 *root.encoder.block.4.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.4.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.4.layer.0.dropout"_tf_keras_layer*{"name": "dropout_17", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_17", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 19}2 +root.encoder.block.4.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.4.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.4.layer.1.dropout"_tf_keras_layer*{"name": "dropout_19", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_19", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 20}2 *root.encoder.block.5.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.5.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.5.layer.0.dropout"_tf_keras_layer*{"name": "dropout_21", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_21", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 21}2 +root.encoder.block.5.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.5.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.5.layer.1.dropout"_tf_keras_layer*{"name": "dropout_23", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_23", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 22}2 *root.encoder.block.6.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.6.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.6.layer.0.dropout"_tf_keras_layer*{"name": "dropout_25", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_25", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 23}2 +root.encoder.block.6.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.6.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.6.layer.1.dropout"_tf_keras_layer*{"name": "dropout_27", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_27", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 24}2 *root.encoder.block.7.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.7.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.7.layer.0.dropout"_tf_keras_layer*{"name": "dropout_29", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_29", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 25}2 +root.encoder.block.7.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.7.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.7.layer.1.dropout"_tf_keras_layer*{"name": "dropout_31", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_31", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 26}2 *root.encoder.block.8.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.8.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.8.layer.0.dropout"_tf_keras_layer*{"name": "dropout_33", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_33", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 27}2 +root.encoder.block.8.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.8.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.8.layer.1.dropout"_tf_keras_layer*{"name": "dropout_35", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_35", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 28}2 *root.encoder.block.9.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.encoder.block.9.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.9.layer.0.dropout"_tf_keras_layer*{"name": "dropout_37", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_37", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 29}2 +root.encoder.block.9.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.encoder.block.9.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.encoder.block.9.layer.1.dropout"_tf_keras_layer*{"name": "dropout_39", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_39", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 30}2 +root.encoder.block.10.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.encoder.block.10.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.encoder.block.10.layer.0.dropout"_tf_keras_layer*{"name": "dropout_41", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_41", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 31}2 ,root.encoder.block.10.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 (root.encoder.block.10.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.encoder.block.10.layer.1.dropout"_tf_keras_layer*{"name": "dropout_43", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_43", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 32}2 +root.encoder.block.11.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.encoder.block.11.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.encoder.block.11.layer.0.dropout"_tf_keras_layer*{"name": "dropout_45", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_45", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 33}2 ,root.encoder.block.11.layer.1.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 (root.encoder.block.11.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.encoder.block.11.layer.1.dropout"_tf_keras_layer*{"name": "dropout_47", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_47", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 34}2 *root.decoder.block.0.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.0.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.0.layer.0.dropout"_tf_keras_layer*{"name": "dropout_50", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_50", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 35}2 ,root.decoder.block.0.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.0.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.0.layer.1.dropout"_tf_keras_layer*{"name": "dropout_52", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_52", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 36}2 +root.decoder.block.0.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.0.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.0.layer.2.dropout"_tf_keras_layer*{"name": "dropout_54", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_54", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 37}2 *root.decoder.block.1.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.1.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.1.layer.0.dropout"_tf_keras_layer*{"name": "dropout_56", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_56", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 38}2 ,root.decoder.block.1.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.1.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.1.layer.1.dropout"_tf_keras_layer*{"name": "dropout_58", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_58", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 39}2 +root.decoder.block.1.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.1.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.1.layer.2.dropout"_tf_keras_layer*{"name": "dropout_60", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_60", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 40}2 *root.decoder.block.2.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.2.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.2.layer.0.dropout"_tf_keras_layer*{"name": "dropout_62", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_62", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 41}2 ,root.decoder.block.2.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.2.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.2.layer.1.dropout"_tf_keras_layer*{"name": "dropout_64", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_64", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 42}2 +root.decoder.block.2.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.2.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.2.layer.2.dropout"_tf_keras_layer*{"name": "dropout_66", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_66", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 43}2 *root.decoder.block.3.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.3.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.3.layer.0.dropout"_tf_keras_layer*{"name": "dropout_68", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_68", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 44}2 ,root.decoder.block.3.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.3.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.3.layer.1.dropout"_tf_keras_layer*{"name": "dropout_70", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_70", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 45}2 +root.decoder.block.3.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.3.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.3.layer.2.dropout"_tf_keras_layer*{"name": "dropout_72", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_72", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 46}2 *root.decoder.block.4.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.4.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.4.layer.0.dropout"_tf_keras_layer*{"name": "dropout_74", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_74", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 47}2 ,root.decoder.block.4.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.4.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.4.layer.1.dropout"_tf_keras_layer*{"name": "dropout_76", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_76", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 48}2 +root.decoder.block.4.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.4.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.4.layer.2.dropout"_tf_keras_layer*{"name": "dropout_78", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_78", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 49}2 *root.decoder.block.5.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.5.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.5.layer.0.dropout"_tf_keras_layer*{"name": "dropout_80", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_80", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 50}2 ,root.decoder.block.5.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.5.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.5.layer.1.dropout"_tf_keras_layer*{"name": "dropout_82", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_82", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 51}2 +root.decoder.block.5.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.5.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.5.layer.2.dropout"_tf_keras_layer*{"name": "dropout_84", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_84", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 52}2 *root.decoder.block.6.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.6.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.6.layer.0.dropout"_tf_keras_layer*{"name": "dropout_86", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_86", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 53}2 ,root.decoder.block.6.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.6.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.6.layer.1.dropout"_tf_keras_layer*{"name": "dropout_88", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_88", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 54}2 +root.decoder.block.6.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.6.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.6.layer.2.dropout"_tf_keras_layer*{"name": "dropout_90", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_90", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 55}2 *root.decoder.block.7.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.7.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.7.layer.0.dropout"_tf_keras_layer*{"name": "dropout_92", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_92", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 56}2 ,root.decoder.block.7.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.7.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.7.layer.1.dropout"_tf_keras_layer*{"name": "dropout_94", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_94", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 57}2 +root.decoder.block.7.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.7.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.7.layer.2.dropout"_tf_keras_layer*{"name": "dropout_96", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_96", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 58}2 *root.decoder.block.8.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.8.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.8.layer.0.dropout"_tf_keras_layer*{"name": "dropout_98", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_98", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 59}2 ,root.decoder.block.8.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.8.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.8.layer.1.dropout"_tf_keras_layer*{"name": "dropout_100", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_100", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 60}2 +root.decoder.block.8.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.8.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.8.layer.2.dropout"_tf_keras_layer*{"name": "dropout_102", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_102", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 61}2 *root.decoder.block.9.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.9.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.9.layer.0.dropout"_tf_keras_layer*{"name": "dropout_104", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_104", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 62}2 ,root.decoder.block.9.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 'root.decoder.block.9.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.9.layer.1.dropout"_tf_keras_layer*{"name": "dropout_106", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_106", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 63}2 +root.decoder.block.9.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 'root.decoder.block.9.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 $root.decoder.block.9.layer.2.dropout"_tf_keras_layer*{"name": "dropout_108", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_108", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 64}2 +root.decoder.block.10.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.decoder.block.10.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.10.layer.0.dropout"_tf_keras_layer*{"name": "dropout_110", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_110", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 65}2 -root.decoder.block.10.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.decoder.block.10.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.10.layer.1.dropout"_tf_keras_layer*{"name": "dropout_112", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_112", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 66}2 ,root.decoder.block.10.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 (root.decoder.block.10.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.10.layer.2.dropout"_tf_keras_layer*{"name": "dropout_114", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_114", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 67}2 +root.decoder.block.11.layer.0.SelfAttention"_tf_keras_layer*{"name": "SelfAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.decoder.block.11.layer.0.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.11.layer.0.dropout"_tf_keras_layer*{"name": "dropout_116", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_116", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 68}2 -root.decoder.block.11.layer.1.EncDecAttention"_tf_keras_layer*{"name": "EncDecAttention", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5Attention", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 (root.decoder.block.11.layer.1.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.11.layer.1.dropout"_tf_keras_layer*{"name": "dropout_118", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_118", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 69}2 ,root.decoder.block.11.layer.2.DenseReluDense"_tf_keras_layer*{"name": "DenseReluDense", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5DenseGatedActDense", "config": {"layer was saved without config": true}}2 (root.decoder.block.11.layer.2.layer_norm"_tf_keras_layer*{"name": "layer_norm", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "TFT5LayerNorm", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 %root.decoder.block.11.layer.2.dropout"_tf_keras_layer*{"name": "dropout_120", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_120", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 70}2 ,root.encoder.block.0.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 71}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 72}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 73, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 74}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.encoder.block.0.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 75}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 76}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 77, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 78}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.encoder.block.0.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 79}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 80}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 81, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 82}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.encoder.block.0.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 83}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 84}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 85, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 86}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.encoder.block.0.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 87}2  0root.encoder.block.0.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 88}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 89}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 90, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 91}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.0.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 88}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 92}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 93, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 94}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.0.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 95}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 96}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 97, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 98}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.0.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_2", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_2", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 99}2  ,root.encoder.block.1.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 100}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 101}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 102, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 103}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.1.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 104}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 105}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 106, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 107}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.1.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 108}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 109}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 110, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 111}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.1.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 112}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 113}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 114, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 115}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.1.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_4", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_4", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 116}2  0root.encoder.block.1.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 117}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 118}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 119, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 120}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.1.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 117}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 121}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 122, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 123}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.1.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 124}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 125}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 126, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 127}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.1.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_6", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_6", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 128}2  ,root.encoder.block.2.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 129}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 130}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 131, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 132}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.2.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 133}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 134}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 135, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 136}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.2.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 137}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 138}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 139, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 140}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.2.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 141}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 142}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 143, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 144}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.2.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_8", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_8", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 145}2  0root.encoder.block.2.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 146}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 147}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 148, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 149}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.2.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 146}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 150}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 151, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 152}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.2.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 153}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 154}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 155, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 156}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.2.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_10", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_10", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 157}2  ,root.encoder.block.3.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 158}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 159}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 160, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 161}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.3.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 162}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 163}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 164, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 165}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.3.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 166}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 167}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 168, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 169}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.3.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 170}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 171}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 172, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 173}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.3.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_12", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_12", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 174}2  0root.encoder.block.3.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 175}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 176}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 177, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 178}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.3.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 175}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 179}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 180, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 181}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.3.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 182}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 183}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 184, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 185}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.3.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_14", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_14", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 186}2  ,root.encoder.block.4.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 187}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 188}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 189, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 190}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.4.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 191}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 192}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 193, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 194}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.4.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 195}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 196}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 197, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 198}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.4.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 199}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 200}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 201, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 202}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.4.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_16", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_16", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 203}2  0root.encoder.block.4.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 204}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 205}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 206, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 207}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.4.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 204}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 208}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 209, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 210}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.4.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 211}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 212}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 213, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 214}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.4.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_18", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_18", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 215}2  ,root.encoder.block.5.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 216}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 217}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 218, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 219}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.5.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 220}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 221}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 222, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 223}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.5.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 224}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 225}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 226, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 227}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.5.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 228}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 229}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 230, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 231}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.5.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_20", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_20", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 232}2  0root.encoder.block.5.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 233}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 234}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 235, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 236}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.5.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 233}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 237}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 238, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 239}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.5.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 240}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 241}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 242, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 243}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.5.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_22", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_22", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 244}2  ,root.encoder.block.6.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 245}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 246}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 247, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 248}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.6.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 249}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 250}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 251, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 252}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.6.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 253}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 254}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 255, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 256}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.6.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 257}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 258}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 259, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 260}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.6.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_24", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_24", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 261}2  0root.encoder.block.6.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 262}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 263}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 264, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 265}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.6.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 262}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 266}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 267, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 268}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.6.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 269}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 270}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 271, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 272}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.6.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_26", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_26", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 273}2  ,root.encoder.block.7.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 274}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 275}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 276, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 277}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.7.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 278}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 279}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 280, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 281}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.7.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 282}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 283}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 284, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 285}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.7.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 286}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 287}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 288, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 289}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.7.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_28", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_28", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 290}2  0root.encoder.block.7.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 291}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 292}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 293, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 294}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.7.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 291}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 295}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 296, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 297}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.7.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 298}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 299}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 300, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 301}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.7.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_30", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_30", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 302}2  ,root.encoder.block.8.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 303}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 304}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 305, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 306}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.8.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 307}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 308}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 309, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 310}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.8.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 311}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 312}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 313, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 314}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.8.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 315}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 316}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 317, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 318}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.8.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_32", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_32", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 319}2  0root.encoder.block.8.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 320}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 321}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 322, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 323}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.8.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 320}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 324}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 325, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 326}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.8.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 327}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 328}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 329, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 330}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.8.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_34", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_34", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 331}2  ,root.encoder.block.9.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 332}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 333}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 334, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 335}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.9.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 336}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 337}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 338, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 339}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.9.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 340}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 341}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 342, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 343}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.encoder.block.9.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 344}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 345}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 346, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 347}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.encoder.block.9.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_36", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_36", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 348}2  0root.encoder.block.9.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 349}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 350}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 351, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 352}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.encoder.block.9.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 349}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 353}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 354, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 355}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.encoder.block.9.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 356}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 357}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 358, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 359}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.encoder.block.9.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_38", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_38", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 360}2  -root.encoder.block.10.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 361}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 362}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 363, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 364}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.10.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 365}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 366}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 367, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 368}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.10.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 369}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 370}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 371, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 372}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.10.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 373}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 374}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 375, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 376}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  3root.encoder.block.10.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_40", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_40", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 377}2  1root.encoder.block.10.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 378}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 379}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 380, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 381}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  1root.encoder.block.10.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 378}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 382}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 383, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 384}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  /root.encoder.block.10.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 385}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 386}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 387, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 388}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  4root.encoder.block.10.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_42", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_42", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 389}2  -root.encoder.block.11.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 390}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 391}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 392, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 393}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.11.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 394}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 395}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 396, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 397}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.11.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 398}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 399}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 400, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 401}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  -root.encoder.block.11.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 402}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 403}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 404, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 405}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  3root.encoder.block.11.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_44", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_44", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 406}2  1root.encoder.block.11.layer.1.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 407}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 408}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 409, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 410}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  1root.encoder.block.11.layer.1.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 407}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 411}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 412, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 413}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  /root.encoder.block.11.layer.1.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 414}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 415}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 416, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 417}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  4root.encoder.block.11.layer.1.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_46", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_46", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 418}2  ,root.decoder.block.0.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 419}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 420}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 421, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 422}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.0.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 423}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 424}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 425, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 426}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.0.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 427}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 428}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 429, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 430}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.0.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 431}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 432}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 433, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 434}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.decoder.block.0.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_49", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_49", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 435}2  .root.decoder.block.0.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 436}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 437}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 438, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 439}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.0.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 440}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 441}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 442, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 443}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.0.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 444}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 445}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 446, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 447}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.0.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 448}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 449}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 450, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 451}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  4root.decoder.block.0.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_51", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_51", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 452}2  0root.decoder.block.0.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 453}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 454}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 455, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 456}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.decoder.block.0.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 453}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 457}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 458, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 459}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.0.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 460}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 461}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 462, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 463}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.decoder.block.0.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_53", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_53", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 464}2  ,root.decoder.block.1.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 465}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 466}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 467, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 468}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.1.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 469}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 470}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 471, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 472}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.1.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 473}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 474}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 475, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 476}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.1.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 477}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 478}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 479, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 480}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.decoder.block.1.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_55", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_55", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 481}2  .root.decoder.block.1.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 482}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 483}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 484, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 485}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.1.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 486}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 487}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 488, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 489}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.1.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 490}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 491}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 492, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 493}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.1.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 494}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 495}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 496, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 497}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  4root.decoder.block.1.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_57", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_57", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 498}2  0root.decoder.block.1.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 499}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 500}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 501, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 502}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  0root.decoder.block.1.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 499}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 503}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 504, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 505}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  .root.decoder.block.1.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 506}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 507}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 508, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 509}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2  3root.decoder.block.1.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_59", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_59", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 510}2  ,root.decoder.block.2.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 511}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 512}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 513, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 514}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.2.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 515}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 516}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 517, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 518}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.2.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 519}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 520}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 521, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 522}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  ,root.decoder.block.2.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 523}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 524}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 525, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 526}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2  2root.decoder.block.2.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_61", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_61", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 527}2 .root.decoder.block.2.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 528}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 529}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 530, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 531}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.2.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 532}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 533}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 534, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 535}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.2.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 536}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 537}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 538, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 539}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.2.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 540}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 541}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 542, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 543}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.2.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_63", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_63", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 544}2 0root.decoder.block.2.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 545}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 546}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 547, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 548}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.2.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 545}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 549}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 550, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 551}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.2.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 552}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 553}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 554, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 555}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.2.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_65", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_65", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 556}2 ,root.decoder.block.3.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 557}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 558}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 559, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 560}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.3.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 561}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 562}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 563, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 564}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.3.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 565}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 566}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 567, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 568}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.3.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 569}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 570}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 571, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 572}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.3.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_67", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_67", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 573}2 .root.decoder.block.3.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 574}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 575}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 576, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 577}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.3.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 578}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 579}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 580, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 581}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.3.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 582}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 583}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 584, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 585}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.3.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 586}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 587}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 588, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 589}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.3.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_69", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_69", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 590}2 0root.decoder.block.3.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 591}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 592}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 593, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 594}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.3.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 591}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 595}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 596, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 597}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.3.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 598}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 599}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 600, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 601}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.3.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_71", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_71", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 602}2 ,root.decoder.block.4.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 603}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 604}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 605, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 606}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.4.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 607}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 608}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 609, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 610}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.4.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 611}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 612}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 613, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 614}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.4.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 615}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 616}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 617, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 618}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.4.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_73", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_73", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 619}2 .root.decoder.block.4.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 620}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 621}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 622, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 623}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.4.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 624}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 625}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 626, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 627}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.4.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 628}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 629}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 630, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 631}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.4.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 632}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 633}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 634, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 635}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.4.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_75", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_75", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 636}2 0root.decoder.block.4.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 637}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 638}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 639, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 640}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.4.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 637}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 641}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 642, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 643}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.4.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 644}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 645}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 646, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 647}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.4.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_77", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_77", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 648}2 ,root.decoder.block.5.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 649}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 650}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 651, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 652}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.5.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 653}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 654}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 655, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 656}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.5.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 657}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 658}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 659, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 660}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.5.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 661}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 662}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 663, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 664}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.5.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_79", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_79", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 665}2 .root.decoder.block.5.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 666}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 667}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 668, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 669}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.5.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 670}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 671}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 672, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 673}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.5.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 674}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 675}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 676, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 677}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.5.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 678}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 679}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 680, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 681}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.5.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_81", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_81", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 682}2 0root.decoder.block.5.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 683}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 684}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 685, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 686}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.5.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 683}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 687}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 688, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 689}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.5.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 690}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 691}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 692, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 693}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.5.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_83", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_83", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 694}2 ,root.decoder.block.6.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 695}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 696}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 697, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 698}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.6.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 699}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 700}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 701, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 702}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.6.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 703}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 704}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 705, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 706}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.6.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 707}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 708}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 709, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 710}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.6.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_85", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_85", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 711}2 .root.decoder.block.6.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 712}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 713}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 714, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 715}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.6.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 716}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 717}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 718, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 719}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.6.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 720}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 721}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 722, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 723}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.6.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 724}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 725}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 726, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 727}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.6.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_87", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_87", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 728}2 0root.decoder.block.6.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 729}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 730}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 731, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 732}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.6.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 729}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 733}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 734, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 735}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.6.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 736}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 737}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 738, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 739}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.6.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_89", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_89", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 740}2 ,root.decoder.block.7.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 741}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 742}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 743, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 744}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.7.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 745}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 746}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 747, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 748}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.7.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 749}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 750}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 751, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 752}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.7.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 753}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 754}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 755, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 756}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.7.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_91", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_91", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 757}2 .root.decoder.block.7.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 758}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 759}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 760, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 761}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.7.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 762}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 763}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 764, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 765}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.7.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 766}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 767}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 768, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 769}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.7.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 770}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 771}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 772, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 773}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.7.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_93", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_93", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 774}2 0root.decoder.block.7.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 775}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 776}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 777, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 778}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.7.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 775}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 779}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 780, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 781}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.7.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 782}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 783}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 784, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 785}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.7.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_95", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_95", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 786}2 ,root.decoder.block.8.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 787}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 788}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 789, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 790}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.8.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 791}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 792}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 793, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 794}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.8.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 795}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 796}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 797, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 798}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.8.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 799}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 800}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 801, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 802}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.8.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_97", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_97", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 803}2 .root.decoder.block.8.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 804}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 805}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 806, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 807}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.8.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 808}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 809}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 810, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 811}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.8.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 812}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 813}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 814, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 815}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.8.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 816}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 817}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 818, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 819}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.8.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_99", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_99", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 820}2 0root.decoder.block.8.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 821}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 822}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 823, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 824}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.8.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 821}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 825}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 826, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 827}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.8.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 828}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 829}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 830, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 831}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.8.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_101", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_101", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 832}2 ,root.decoder.block.9.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 833}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 834}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 835, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 836}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.9.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 837}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 838}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 839, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 840}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.9.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 841}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 842}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 843, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 844}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 ,root.decoder.block.9.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 845}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 846}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 847, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 848}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 2root.decoder.block.9.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_103", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_103", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 849}2 .root.decoder.block.9.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 850}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 851}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 852, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 853}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.9.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 854}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 855}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 856, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 857}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.9.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 858}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 859}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 860, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 861}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.9.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 862}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 863}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 864, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 865}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 4root.decoder.block.9.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_105", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_105", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 866}2 0root.decoder.block.9.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 867}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 868}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 869, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 870}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 0root.decoder.block.9.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 867}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 871}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 872, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 873}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 .root.decoder.block.9.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 874}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 875}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 876, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 877}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 3root.decoder.block.9.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_107", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_107", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 878}2 -root.decoder.block.10.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 879}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 880}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 881, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 882}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.10.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 883}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 884}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 885, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 886}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.10.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 887}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 888}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 889, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 890}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.10.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 891}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 892}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 893, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 894}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 3root.decoder.block.10.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_109", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_109", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 895}2 /root.decoder.block.10.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 896}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 897}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 898, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 899}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.10.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 900}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 901}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 902, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 903}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.10.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 904}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 905}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 906, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 907}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.10.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 908}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 909}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 910, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 911}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 5root.decoder.block.10.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_111", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_111", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 912}2 1root.decoder.block.10.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 913}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 914}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 915, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 916}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 1root.decoder.block.10.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 913}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 917}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 918, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 919}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.10.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 920}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 921}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 922, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 923}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 4root.decoder.block.10.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_113", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_113", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 924}2 -root.decoder.block.11.layer.0.SelfAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 925}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 926}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 927, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 928}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.11.layer.0.SelfAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 929}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 930}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 931, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 932}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.11.layer.0.SelfAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 933}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 934}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 935, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 936}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 -root.decoder.block.11.layer.0.SelfAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 937}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 938}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 939, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 940}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 3root.decoder.block.11.layer.0.SelfAttention.dropout"_tf_keras_layer*{"name": "dropout_115", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_115", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 941}2 /root.decoder.block.11.layer.1.EncDecAttention.q"_tf_keras_layer*{"name": "q", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "q", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.004510548978043951, "seed": null}, "shared_object_id": 942}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 943}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 944, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 945}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.11.layer.1.EncDecAttention.k"_tf_keras_layer*{"name": "k", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "k", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 946}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 947}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 948, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 949}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.11.layer.1.EncDecAttention.v"_tf_keras_layer*{"name": "v", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "v", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 950}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 951}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 952, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 953}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.11.layer.1.EncDecAttention.o"_tf_keras_layer*{"name": "o", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "o", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 954}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 955}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 956, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 957}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 5root.decoder.block.11.layer.1.EncDecAttention.dropout"_tf_keras_layer*{"name": "dropout_117", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_117", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 958}2 1root.decoder.block.11.layer.2.DenseReluDense.wi_0"_tf_keras_layer*{"name": "wi_0", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_0", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 959}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 960}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 961, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 962}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 1root.decoder.block.11.layer.2.DenseReluDense.wi_1"_tf_keras_layer*{"name": "wi_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wi_1", "trainable": true, "dtype": "float32", "units": 2048, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.03608439182435161, "seed": null}, "shared_object_id": 959}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 963}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 964, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 965}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 768]}}2 /root.decoder.block.11.layer.2.DenseReluDense.wo"_tf_keras_layer*{"name": "wo", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dense", "config": {"name": "wo", "trainable": true, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": false, "kernel_initializer": {"class_name": "RandomNormal", "config": {"mean": 0, "stddev": 0.02209708691207961, "seed": null}, "shared_object_id": 966}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 967}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 968, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 2048}}, "shared_object_id": 969}, "build_input_shape": {"class_name": "TensorShape", "items": [3, 5, 2048]}}2 4root.decoder.block.11.layer.2.DenseReluDense.dropout"_tf_keras_layer*{"name": "dropout_119", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "class_name": "Dropout", "config": {"name": "dropout_119", "trainable": true, "dtype": "float32", "rate": 0.1, "noise_shape": null, "seed": null}, "shared_object_id": 970}2