# Source code for mindnlp.abc.modules.decoder

# Copyright 2022 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""Decoder basic model"""

from mindspore import nn


class DecoderBase(nn.Cell):
    r"""
    Base class for decoders.

    This class wires together the decoding pipeline (``extract_features``
    followed by ``output_layer``) but implements neither step: both raise
    ``NotImplementedError`` here and must be overridden by subclasses.

    Args:
        embedding (Cell): The embedding layer.
    """

    def __init__(self, embedding):
        super().__init__()
        # Stored for subclasses; this base class never calls it itself.
        self.embedding = embedding
        # Both normalization layers are built up front so that
        # ``get_normalized_probs`` can select one from its ``log_probs`` flag.
        self.softmax = nn.Softmax()
        self.log_softmax = nn.LogSoftmax()

    def construct(self, prev_output_tokens, encoder_out=None):
        """
        Construct method.

        Runs ``extract_features`` and passes its result to ``output_layer``.

        Args:
            prev_output_tokens (Tensor): output tokens for teacher forcing with shape [batch, tgt_len].
            encoder_out (Tensor): output of encoder. Defaults to None.

        Returns:
            Tensor, The result vector of decoder.

        Raises:
            NotImplementedError: If ``extract_features`` or ``output_layer``
                has not been overridden by a subclass.
        """
        result = self.extract_features(prev_output_tokens, encoder_out)
        result = self.output_layer(result)
        return result

    def extract_features(self, prev_output_tokens, encoder_out=None):
        """
        Extract features from the previous output tokens and the encoder output.

        Args:
            prev_output_tokens (Tensor): output tokens for teacher forcing with shape [batch, tgt_len].
            encoder_out (Tensor): output of encoder. Defaults to None.

        Returns:
            The extracted features, which ``construct`` forwards to ``output_layer``.

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError

    def output_layer(self, features):
        """
        Project features to the default output size.

        Args:
            features (Tensor): The extracted features.

        Returns:
            The projected features, which ``construct`` returns to the caller.

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError

    def get_normalized_probs(self, net_output, log_probs):
        """
        Get normalized probabilities from net's output.

        Args:
            net_output (tuple): The net's output. Only its first element is
                read; it is treated as the logits.
            log_probs (bool): Decide whether to use log_softmax or softmax. If True, use log_softmax.
                If False, use softmax.

        Returns:
            Tensor, the normalized probabilities from net's output.
        """
        logits = net_output[0]
        if log_probs:
            result = self.log_softmax(logits)
        else:
            result = self.softmax(logits)
        return result