Source code for transformers.models.blenderbot.modeling_tf_blenderbot

# coding=utf-8
# Copyright 2020 The Facebook AI Research Team Authors and The HuggingFace Inc. team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""TF BlenderBot model, ported from the fairseq repo."""

import tensorflow as tf

from ...file_utils import add_start_docstrings
from ...utils import logging
from ..bart.modeling_tf_bart import BART_START_DOCSTRING, LARGE_NEGATIVE, TFBartForConditionalGeneration
from .configuration_blenderbot import BlenderbotConfig


_CONFIG_FOR_DOC = "BlenderbotConfig"

START_DOCSTRING = BART_START_DOCSTRING.replace(
    "inherits from :class:`~transformers.TFPreTrainedModel`",
    "inherits from :class:`~transformers.TFBartForConditionalGeneration`",
).replace("BartConfig", _CONFIG_FOR_DOC)


logger = logging.get_logger(__name__)


[docs]@add_start_docstrings("Blenderbot model for open domain dialogue", START_DOCSTRING) class TFBlenderbotForConditionalGeneration(TFBartForConditionalGeneration): config_class = BlenderbotConfig
[docs] def adjust_logits_during_generation(self, logits, cur_len, max_length): """Never predict pad_token_id. Predict </s> when max_length is reached.""" vocab_range = tf.constant(range(self.config.vocab_size)) logits = tf.where(vocab_range == self.config.pad_token_id, LARGE_NEGATIVE, logits) if cur_len == max_length - 1: logits = tf.where(vocab_range != self.config.eos_token_id, LARGE_NEGATIVE, logits) return logits