!41988 add strided_slice and KLDivLoss interface

Merge pull request !41988 from 范吉斌/add_interface
i-robot 2022-09-15 14:05:09 +00:00 committed by Gitee
commit cc826879ef
No known key found for this signature in database
GPG Key ID: 173E9B9CA92EEF8F
7 changed files with 210 additions and 3 deletions

View File

@@ -23,10 +23,10 @@ from __future__ import absolute_import
from mindspore.nn.loss.loss import LossBase, L1Loss, MSELoss, SmoothL1Loss, SoftMarginLoss, FocalLoss,\
    SoftmaxCrossEntropyWithLogits, BCELoss, MultiMarginLoss, CosineEmbeddingLoss, \
    SampledSoftmaxLoss, DiceLoss, BCEWithLogitsLoss, MultiClassDiceLoss,\
-   RMSELoss, MAELoss, HuberLoss, CrossEntropyLoss, NLLLoss
+   RMSELoss, MAELoss, HuberLoss, CrossEntropyLoss, NLLLoss, KLDivLoss
__all__ = ['LossBase', 'L1Loss', 'MSELoss', 'SmoothL1Loss', 'SoftMarginLoss', 'FocalLoss',
           'SoftmaxCrossEntropyWithLogits', 'BCELoss', 'BCEWithLogitsLoss', 'MultiMarginLoss',
           'CosineEmbeddingLoss', 'SampledSoftmaxLoss', 'DiceLoss', 'MultiClassDiceLoss',
-          'RMSELoss', 'MAELoss', 'HuberLoss', 'CrossEntropyLoss', 'NLLLoss']
+          'RMSELoss', 'MAELoss', 'HuberLoss', 'CrossEntropyLoss', 'NLLLoss', 'KLDivLoss']

View File

@@ -2079,3 +2079,69 @@ class CrossEntropyLoss(LossBase):
        if logits.ndim == labels.ndim and self.ignore_index > 0:
            _cross_entropy_ignore_index_warning(self.cls_name)
        return F.cross_entropy(logits, labels, self.weight, self.ignore_index, self.reduction, self.label_smoothing)


class KLDivLoss(LossBase):
    r"""
    Computes the Kullback-Leibler divergence between the logits and the labels.

    KLDivLoss is computed as follows:

    .. math::
        L = \{l_1,\dots,l_N\}^\top, \quad
        l_n = target_n \cdot (\log target_n - x_n)

    Then,

    .. math::
        \ell(x, target) = \begin{cases}
        L, & \text{if reduction} = \text{'none';}\\
        \operatorname{mean}(L), & \text{if reduction} = \text{'mean';}\\
        \operatorname{batchmean}(L), & \text{if reduction} = \text{'batchmean';}\\
        \operatorname{sum}(L), & \text{if reduction} = \text{'sum'.}
        \end{cases}

    where :math:`x` represents `logits`, :math:`target` represents `labels`, and
    :math:`\ell(x, target)` represents the output.

    Note:
        Currently, float64 input is not supported on `Ascend`.
        The output matches the mathematical definition of Kullback-Leibler divergence
        only when `reduction` is set to 'batchmean'.

    Args:
        reduction (str): Specifies the reduction to be applied to the output.
            Its value must be one of 'none', 'mean', 'batchmean' or 'sum'. Default: 'mean'.

    Inputs:
        - **logits** (Tensor) - The input Tensor. The data type must be float16, float32 or float64.
        - **labels** (Tensor) - The label Tensor, which has the same shape and data type as `logits`.

    Outputs:
        Tensor or Scalar. If `reduction` is 'none', the output is a tensor with the same shape
        as `logits`. Otherwise, it is a scalar.

    Raises:
        TypeError: If `reduction` is not a str.
        TypeError: If `logits` or `labels` is not a Tensor.
        TypeError: If the dtype of `logits` or `labels` is not float16, float32 or float64.

    Supported Platforms:
        ``Ascend`` ``GPU`` ``CPU``

    Examples:
        >>> logits = Tensor(np.array([0.2, 0.7, 0.1]), mindspore.float32)
        >>> labels = Tensor(np.array([0., 1., 0.]), mindspore.float32)
        >>> loss = nn.KLDivLoss(reduction='mean')
        >>> output = loss(logits, labels)
        >>> print(output)
        -0.23333333
    """

    def __init__(self, reduction='mean'):
        super().__init__()
        self.reduction = reduction

    def construct(self, logits, labels):
        _check_is_tensor('logits', logits, self.cls_name)
        _check_is_tensor('labels', labels, self.cls_name)
        return F.kl_div(logits, labels, self.reduction)
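A minimal NumPy cross-check of the reduction formulas above (not part of the diff), assuming the standard convention 0 * log(0) = 0 for zero-valued labels; the input values are illustrative.

import numpy as np
import mindspore.nn as nn
from mindspore import Tensor

x = np.log(np.array([[0.3, 0.7], [0.5, 0.5]], dtype=np.float32))  # logits
t = np.array([[0.0, 1.0], [1.0, 0.5]], dtype=np.float32)          # labels

# Element-wise term l_n = t_n * (log(t_n) - x_n), taking 0 * log(0) = 0.
l = np.where(t > 0, t * (np.log(np.where(t > 0, t, 1.0)) - x), 0.0)

for reduction, expect in [("none", l),
                          ("mean", l.mean()),
                          ("sum", l.sum()),
                          ("batchmean", l.sum() / l.shape[0])]:
    out = nn.KLDivLoss(reduction=reduction)(Tensor(x), Tensor(t))
    assert np.allclose(out.asnumpy(), expect), reduction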

View File

@@ -51,6 +51,7 @@ from .array_func import (
    stack,
    unstack,
    tensor_slice,
+   strided_slice,
    slice,
    scalar_to_array,
    scalar_to_tensor,

View File

@@ -1060,6 +1060,108 @@ def select(cond, x, y):
    return tensor_select_(cond, input_x, input_y)


def strided_slice(input_x, begin, end, strides):
r"""
Extracts a strided slice of a tensor.
This operation extracts a fragment of size (end-begin)/stride from the given 'input_tensor'.
Starting from the beginning position, the fragment continues adding stride to the index until
all dimensions are not less than the ending position.
Note:
The stride may be negative value, which causes reverse slicing.
The shape of `begin`, `end` and `strides` must be the same.
`begin` and `end` are zero-indexed. The element of `strides` must be non-zero.
Args:
input_x (Tensor): The input Tensor.
begin (tuple[int]): A tuple which represents the location where to start. Only
constant value is allowed.
end (tuple[int]): A tuple or which represents the maximum location where to end.
Only constant value is allowed.
strides (tuple[int]): - A tuple which represents the stride is continuously added
before reaching the maximum location. Only constant value is allowed.
Returns:
Tensor, The output is explained by following example.
In the 0th dimension, begin is 1, end is 2, and strides is 1,
because :math:`1+1=2\geq2`, the interval is :math:`[1,2)`.
Thus, return the element with :math:`index = 1` in 0th dimension, i.e., [[3, 3, 3], [4, 4, 4]].
In the 1st dimension, similarly, the interval is :math:`[0,1)`.
Based on the return value of the 0th dimension, return the element with :math:`index = 0`,
i.e., [3, 3, 3].
In the 2nd dimension, similarly, the interval is :math:`[0,3)`.
Based on the return value of the 1st dimension, return the element with :math:`index = 0,1,2`,
i.e., [3, 3, 3].
Finally, the output is [3, 3, 3].
    Raises:
        TypeError: If `begin`, `end` or `strides` is not a tuple.

    Supported Platforms:
        ``Ascend`` ``GPU`` ``CPU``

    Examples:
        >>> input_x = Tensor([[[1, 1, 1], [2, 2, 2]], [[3, 3, 3], [4, 4, 4]],
        ...                   [[5, 5, 5], [6, 6, 6]]], mindspore.float32)
        >>> output = ops.strided_slice(input_x, (1, 0, 2), (3, 1, 3), (1, 1, 1))
        >>> # Take " output = ops.strided_slice(input_x, (1, 0, 2), (3, 1, 3), (1, 1, 1)) " as an example:
        >>> # start = [1, 0, 2], end = [3, 1, 3], stride = [1, 1, 1]. Find the segment (start, end);
        >>> # note that end is an open interval.
        >>> # To facilitate understanding, this operator can be divided into three steps:
        >>> # Step 1: Calculation in the first dimension:
        >>> # start = 1, end = 3, stride = 1, so rows 1 and 2 are taken, giving the output at this step:
        >>> # output_1st =
        >>> # [
        >>> #     [
        >>> #         [3,3,3]
        >>> #         [4,4,4]
        >>> #     ]
        >>> #     [
        >>> #         [5,5,5]
        >>> #         [6,6,6]
        >>> #     ]
        >>> # ]
        >>> # Step 2: Calculation in the second dimension:
        >>> # start = 0, end = 1, stride = 1, so only row 0 is taken, giving the output at this step:
        >>> # output_2nd =
        >>> # [
        >>> #     [
        >>> #         [3,3,3]
        >>> #     ]
        >>> #     [
        >>> #         [5,5,5]
        >>> #     ]
        >>> # ]
        >>> # Step 3: Calculation in the third dimension:
        >>> # start = 2, end = 3, stride = 1, so only column 2 is taken,
        >>> # giving the final output:
        >>> # output_3rd =
        >>> # [
        >>> #     [
        >>> #         [3]
        >>> #     ]
        >>> #     [
        >>> #         [5]
        >>> #     ]
        >>> # ]
        >>> print(output)
        [[[3.]]
         [[5.]]]
        >>> # Another example:
        >>> output = ops.strided_slice(input_x, (1, 0, 0), (2, 1, 3), (1, 1, 1))
        >>> print(output)
        [[[3. 3. 3.]]]
    """
    strided_slice_ = _get_cache_prim(P.StridedSlice)()
    return strided_slice_(input_x, begin, end, strides)
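To illustrate the note above that a negative stride causes reverse slicing, here is a small sketch (not part of the diff); the backward-walking boundary behavior shown is an assumption based on the usual StridedSlice convention that `end` stays exclusive.

import numpy as np
import mindspore
from mindspore import Tensor, ops

x = Tensor(np.array([1., 2., 3., 4., 5.]), mindspore.float32)

# Positive stride 2 over the interval [0, 5): indices 0, 2, 4.
print(ops.strided_slice(x, (0,), (5,), (2,)))   # [1. 3. 5.]

# Negative stride -1: walk backwards from index 3 down to, but excluding,
# index 0, i.e. indices 3, 2, 1 -- reverse slicing.
print(ops.strided_slice(x, (3,), (0,), (-1,)))  # [4. 3. 2.]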
def slice(input_x, begin, size):
    r"""
    Slices a tensor in the specified shape.
@@ -4311,6 +4413,7 @@ __all__ = [
    'reshape_',
    'flatten',
    'tensor_slice',
+   'strided_slice',
    'slice',
    'concat',
    'stack',

View File

@@ -52,7 +52,6 @@ isinstance_ = P.IsInstance()
merge = P.Merge()
geswitch = P.GeSwitch()
-strided_slice = P.StridedSlice()
check_bprop = P.CheckBprop()
sqrt = P.Sqrt()
reduce_sum = P.ReduceSum()

View File

@@ -211,3 +211,24 @@ def test_mode_batchmean_and_dtype_with_dynamic_input(mode, dtype):
    loss = net(Tensor(prediction), Tensor(target))
    expect = np.array([0.52491106]).astype(dtype)
    assert np.allclose(loss.asnumpy(), expect)


@pytest.mark.level0
@pytest.mark.platform_x86_cpu
@pytest.mark.env_onecard
@pytest.mark.parametrize("mode", [context.GRAPH_MODE, context.PYNATIVE_MODE])
@pytest.mark.parametrize("dtype", [np.float16, np.float32, np.float64])
def test_mode_batchmean_with_nn_interface(mode, dtype):
    """
    Feature: test batchmean mode with nn interface.
    Description: test batchmean mode with nn interface.
    Expectation: success.
    """
    context.set_context(mode=mode)
    np.random.seed(42)
    prediction = mindspore.Tensor(np.log(np.array([[0.3, 0.7], [0.5, 0.5]])).astype(dtype))
    target = mindspore.Tensor(np.array([[-1, 1], [1, -1]]).astype(dtype))
    net = nn.KLDivLoss("batchmean")
    loss = net(prediction, target)
    expect = np.array([0.52491106]).astype(dtype)
    assert np.allclose(loss.asnumpy(), expect)
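For reference, the expected value in this test can be reproduced by hand: the entries with target -1 contribute zero (which the expected value itself confirms), so only the two target-1 entries remain, and batchmean divides their sum by the batch size of 2.

import numpy as np

# l = target * (log(target) - x); only the target == 1 entries survive:
#   (0, 1): 1 * (log 1 - log 0.7) = -log 0.7
#   (1, 0): 1 * (log 1 - log 0.5) = -log 0.5
expect = (-np.log(0.7) - np.log(0.5)) / 2  # batchmean: sum / batch_size
print(expect)  # 0.52491106...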

View File

@@ -19,6 +19,7 @@ import pytest
import mindspore.context as context
import mindspore.nn as nn
from mindspore import Tensor
+from mindspore import ops
from mindspore.ops import operations as P
from mindspore.ops.functional import vmap
@@ -61,3 +62,19 @@ def test_slice_vmap():
    output = stridedslice_vmap(x)
    expect = np.ones((16, 1, 2, 3))
    assert np.allclose(output.asnumpy(), expect)


@pytest.mark.level0
@pytest.mark.platform_x86_cpu
@pytest.mark.env_onecard
def test_slice_functional():
    """
    Feature: Test strided_slice functional interface.
    Description: Test strided_slice functional interface.
    Expectation: success.
    """
    x = Tensor(np.array([[[1., 1., 1.], [2, 2, 2]], [[3, 3, 3], [4, 4, 4]],
                         [[5, 5, 5], [6, 7, 8]]]).astype(np.float32))
    output = ops.strided_slice(x, (2, 0, 0), (3, 2, 3), (1, 1, 1))
    expect = [[[5., 5., 5.],
               [6., 7., 8.]]]
    assert (output.asnumpy() == expect).all()
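As an aside (not part of the PR), for positive unit strides the begin/end/strides triple maps directly onto Python slice notation, which gives a quick NumPy cross-check of this test's expectation:

import numpy as np

np_x = np.array([[[1., 1., 1.], [2, 2, 2]], [[3, 3, 3], [4, 4, 4]],
                 [[5, 5, 5], [6, 7, 8]]], dtype=np.float32)

# begin=(2, 0, 0), end=(3, 2, 3), strides=(1, 1, 1) is np_x[2:3:1, 0:2:1, 0:3:1].
assert (np_x[2:3, 0:2, 0:3] == np.array([[[5., 5., 5.], [6., 7., 8.]]])).all()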