!3537 add sparse operators

Merge pull request !3537 from riemann_penn/add_sparse_operator
mindspore-ci-bot 2020-07-31 10:25:55 +08:00 committed by Gitee
commit f1e717554c
14 changed files with 291 additions and 43 deletions

View File

@@ -32,9 +32,11 @@ namespace opt {
using mindspore::abstract::AbstractAttribute;
using mindspore::abstract::AbstractClass;
using mindspore::abstract::AbstractDictionary;
using mindspore::abstract::AbstractIndexedSlices;
using mindspore::abstract::AbstractJTagged;
using mindspore::abstract::AbstractList;
using mindspore::abstract::AbstractScalar;
using mindspore::abstract::AbstractSparseTensor;
using mindspore::abstract::AbstractTuple;
using mindspore::abstract::AbstractUndetermined;
@@ -73,6 +75,19 @@ static AbstractBasePtr AdaptAbs(const AbstractBasePtr &t) {
return std::make_shared<AbstractTuple>(abs_list->elements());
}
if (t->isa<AbstractSparseTensor>()) {
auto abs_sparse = dyn_cast<AbstractSparseTensor>(t);
std::vector<AbstractBasePtr> abstract_list{abs_sparse->indices(), abs_sparse->values(), abs_sparse->dense_shape()};
return std::make_shared<AbstractTuple>(abstract_list);
}
if (t->isa<AbstractIndexedSlices>()) {
auto abs_indexed_slices = dyn_cast<AbstractIndexedSlices>(t);
std::vector<AbstractBasePtr> abstract_list{abs_indexed_slices->indices(), abs_indexed_slices->values(),
abs_indexed_slices->dense_shape()};
return std::make_shared<AbstractTuple>(abstract_list);
}
return nullptr;
}
@@ -389,14 +404,44 @@ bool SimplifyDataStructures(const FuncGraphPtr &root, const FuncGraphManagerPtr
return changed;
}
bool CleanList(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager) {
AnfNodePtr ConvertMakeSparseToMakeTuple(const CNodePtr &node) {
MS_EXCEPTION_IF_NULL(node);
MS_EXCEPTION_IF_NULL(node->func_graph());
std::vector<AnfNodePtr> inputs;
inputs.emplace_back(NewValueNode(prim::kPrimMakeTuple));
// Inputs of the node should be [make_sparse, indices, values, dense_shape], so offset by 1 to get the items.
(void)inputs.insert(inputs.end(), node->inputs().begin() + 1, node->inputs().end());
return node->func_graph()->NewCNode(inputs);
}
AnfNodePtr ConvertSparseGetAttrToTupleGetItem(const CNodePtr &node, const int &index) {
MS_EXCEPTION_IF_NULL(node);
MS_EXCEPTION_IF_NULL(node->func_graph());
const auto &inputs = node->inputs();
// Inputs should be [sparse_getattr, sparse]
if (inputs.size() < 2) {
MS_LOG(EXCEPTION) << "Node's input number < 2.";
}
AnfNodePtr sparse = inputs[1];
MS_EXCEPTION_IF_NULL(sparse);
auto cons_node = NewValueNode(index);
AbstractBasePtr aptr = std::make_shared<AbstractScalar>(std::make_shared<Int32Imm>(index));
cons_node->set_abstract(aptr);
return node->func_graph()->NewCNode({NewValueNode(prim::kPrimTupleGetItem), sparse, cons_node});
}
bool CleanAfterOptA(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager) {
MS_EXCEPTION_IF_NULL(manager);
manager->AddFuncGraph(root);
bool changed = false;
// Since `manager->Replace(...)` modifies the member `all_nodes_`, `all_node` can't be a reference.
AnfNodeSet all_node = manager->all_nodes();
auto all_node = manager->all_nodes();
for (auto &node : all_node) {
MS_EXCEPTION_IF_NULL(node);
auto cnode = node->cast<CNodePtr>();
@@ -409,6 +454,18 @@ bool CleanList(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager) {
new_node = ConvertListSetItemToTupleSetItem(cnode);
} else if (IsValueNode<ValueList>(node)) {
new_node = ConvertValueListNodeToValueTupleNode(node->cast<ValueNodePtr>());
} else if (IsPrimitiveCNode(node, prim::kPrimMakeSparseTensor) ||
IsPrimitiveCNode(node, prim::kPrimMakeIndexedSlices)) {
new_node = ConvertMakeSparseToMakeTuple(cnode);
} else if (IsPrimitiveCNode(node, prim::kPrimSparseTensorGetIndices) ||
IsPrimitiveCNode(node, prim::kPrimIndexedSlicesGetIndices)) {
new_node = ConvertSparseGetAttrToTupleGetItem(cnode, 0);
} else if (IsPrimitiveCNode(node, prim::kPrimSparseTensorGetValues) ||
IsPrimitiveCNode(node, prim::kPrimIndexedSlicesGetValues)) {
new_node = ConvertSparseGetAttrToTupleGetItem(cnode, 1);
} else if (IsPrimitiveCNode(node, prim::kPrimSparseTensorGetDenseShape) ||
IsPrimitiveCNode(node, prim::kPrimIndexedSlicesGetDenseShape)) {
new_node = ConvertSparseGetAttrToTupleGetItem(cnode, 2);
}
if (new_node != nullptr) {

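To make the new conversions concrete: after CleanAfterOptA, a sparse tensor is represented as the 3-tuple (indices, values, dense_shape), and the three getters become tuple_getitem with constant indices 0, 1 and 2. A rough pure-Python analogue of that lowering (illustration only; the real pass rewrites ANF graph nodes, and these helper names are hypothetical):

# Illustration only: hypothetical pure-Python analogue of the lowering performed
# by ConvertMakeSparseToMakeTuple / ConvertSparseGetAttrToTupleGetItem.
def make_sparse_tensor(indices, values, dense_shape):
    # MakeSparseTensor / MakeIndexedSlices -> MakeTuple(indices, values, dense_shape)
    return (indices, values, dense_shape)

def sparse_tensor_get_indices(sparse):
    return sparse[0]  # SparseTensorGetIndices -> tuple_getitem(sparse, 0)

def sparse_tensor_get_values(sparse):
    return sparse[1]  # SparseTensorGetValues -> tuple_getitem(sparse, 1)

def sparse_tensor_get_dense_shape(sparse):
    return sparse[2]  # SparseTensorGetDenseShape -> tuple_getitem(sparse, 2)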
View File

@@ -32,7 +32,7 @@ namespace opt {
// Remove the class type from graphs
bool SimplifyDataStructures(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager);
bool CleanList(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager);
bool CleanAfterOptA(const FuncGraphPtr &root, const FuncGraphManagerPtr &manager);
// Remove most uses of tuples from the graph
// tuples that are returned will be kept

View File

@@ -69,11 +69,11 @@ bool SimplifyDataStructuresPass(const ResourcePtr &res) {
return true;
}
bool CleanListPass(const ResourcePtr &res) {
bool CleanAfterOptAPass(const ResourcePtr &res) {
MS_EXCEPTION_IF_NULL(res->func_graph());
FuncGraphPtr func_graph = res->func_graph();
bool changed = opt::CleanList(func_graph, res->manager());
bool changed = opt::CleanAfterOptA(func_graph, res->manager());
abstract::AbstractBasePtrList args_spec;
auto parameters = func_graph->parameters();
@@ -337,7 +337,7 @@ bool InferenceOptPreparePass(const ResourcePtr &res) {
std::vector<PassItem> kVmPasses = {{"simplify_data_structures", SimplifyDataStructuresPass},
{"opt_a", OptPassAGroup},
{"clean_list", CleanListPass},
{"clean_after_opta", CleanAfterOptAPass},
{"opt_b", OptPassBGroup},
{"cconv", CconvPass},
{"opt_graph_kernel_a", OptPassGraphKernelGroupA},
@@ -346,7 +346,7 @@ std::vector<PassItem> kVmPasses = {{"simplify_data_structures", SimplifyDataStru
std::vector<PassItem> kGePasses = {{"simplify_data_structures", SimplifyDataStructuresPass},
{"opt_a", OptPassAGroup},
{"clean_list", CleanListPass},
{"clean_after_opta", CleanAfterOptAPass},
{"opt_b", OptPassBGroup},
{"add_control_depend", AddControlDependPass},
{"opt_control", ControlGroup},

View File

@@ -17,13 +17,14 @@ Neural Networks Cells.
Pre-defined building blocks or computing units to construct Neural Networks.
"""
from . import layer, loss, optim, metrics, wrap, probability
from . import layer, loss, optim, metrics, wrap, probability, sparse
from .cell import Cell, GraphKernel
from .layer import *
from .loss import *
from .optim import *
from .metrics import *
from .wrap import *
from .sparse import *
__all__ = ["Cell", "GraphKernel"]
@@ -32,7 +33,7 @@ __all__.extend(loss.__all__)
__all__.extend(optim.__all__)
__all__.extend(metrics.__all__)
__all__.extend(wrap.__all__)
__all__.extend(sparse.__all__)
__all__.sort()

View File

@@ -0,0 +1,22 @@
# Copyright 2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""
Sparse related transformation.
"""
from .sparse import SparseToDense
__all__ = [
"SparseToDense",
]

View File

@@ -0,0 +1,54 @@
# Copyright 2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""Sparse related tools."""
from mindspore.ops import operations as P
from ..cell import Cell
class SparseToDense(Cell):
"""
Convert a sparse tensor into a dense tensor.
Not yet supported by any backend at the moment.
Args:
sparse_tensor (SparseTensor): the sparse tensor to convert.
Returns:
Tensor, the converted dense tensor.
Examples:
>>> class SparseToDenseCell(nn.Cell):
>>> def __init__(self, dense_shape):
>>> super(SparseToDenseCell, self).__init__()
>>> self.dense_shape = dense_shape
>>> self.sparse_to_dense = nn.SparseToDense()
>>> def construct(self, indices, values):
>>> sparse = SparseTensor(indices, values, self.dense_shape)
>>> return self.sparse_to_dense(sparse)
>>>
>>> indices = Tensor([[0, 1], [1, 2]])
>>> values = Tensor([1, 2], dtype=ms.float32)
>>> dense_shape = (3, 4)
>>> SparseToDenseCell(dense_shape)(indices, values)
"""
def __init__(self):
super(SparseToDense, self).__init__()
self.sparse_to_dense = P.SparseToDense()
def construct(self, sparse_tensor):
return self.sparse_to_dense(sparse_tensor.indices(),
sparse_tensor.values(),
sparse_tensor.dense_shape())

View File

@@ -15,7 +15,7 @@
"""grad impl."""
from . import grad_array_ops, grad_comm_ops, grad_debug_ops, grad_implementations, \
grad_inner_ops, grad_math_ops, grad_nn_ops, grad_other_ops, grad_quant_ops
grad_inner_ops, grad_math_ops, grad_nn_ops, grad_other_ops, grad_quant_ops, grad_sparse
from .grad_base import get_bprop_fn
__all__ = ['get_bprop_fn']

View File

@@ -116,6 +116,7 @@ def bprop_tuple_getitem(data, idx, out, dout):
"""Backpropagator for primitive `tuple_getitem`."""
return F.tuple_setitem(C.zeros_like(data), idx, dout), C.zeros_like(idx)
@bprops.register("list_getitem")
def bprop_list_getitem(data, idx, out, dout):
"""Backpropagator for primitive `list_getitem`."""

View File

@@ -0,0 +1,58 @@
# Copyright 2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""bprop primitives"""
from .. import functional as F
from .. import operations as P
from ..composite.multitype_ops.zeros_like_impl import zeros_like
from .grad_base import bprops, bprop_getters
# Unused parameters are placeholders.
@bprops.register("MakeSparseTensor")
def bprop_make_sparse_tensor(indices, values, dense_shape, out, dout):
"""Backpropagator for primitive `MakeSparseTensor`."""
return zeros_like(indices), F.sparse_tensor_get_values(dout), ()
@bprops.register("SparseTensorGetIndices")
def bprop_sparse_tensor_get_indices(sparse_tensor, out, dout):
"""Backpropagator for primitive `SparseTensorGetIndices`."""
return (zeros_like(sparse_tensor),)
@bprops.register("SparseTensorGetValues")
def bprop_sparse_tensor_get_values(sparse_tensor, out, dout):
"""Backpropagator for primitive `SparseTensorGetValues`."""
return F.make_sparse_tensor(F.sparse_tensor_get_indices(sparse_tensor),
dout,
F.sparse_tensor_get_dense_shape(sparse_tensor))
@bprops.register("SparseTensorGetDenseShape")
def bprop_sparse_tensor_get_dense_shape(sparse_tensor, out, dout):
"""Backpropagator for primitive `SparseTensorGetDenseShape`."""
return (zeros_like(sparse_tensor),)
@bprop_getters.register(P.SparseToDense)
def get_bprop_sparse_to_dense(self):
"""Generate bprop for SparseToDense"""
def bprop(indices, values, dense_shape, out, dout):
return zeros_like(indices), dout, zeros_like(dense_shape)
return bprop
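One detail worth calling out: the gradient arriving at SparseTensorGetValues is a dense tensor of per-value gradients, and the bprop wraps it back into a sparse tensor that reuses the forward indices and dense_shape, so the gradient stays in sparse form. A rough pure-Python analogue of that intent, using the same hypothetical tuple representation as the sketch for the clean pass above (not real graph nodes):

# Rough analogue only; the real bprop operates on graph nodes, not tuples.
def bprop_get_values_analogue(sparse_tensor, dout):
    indices, _, dense_shape = sparse_tensor
    # Wrap the dense gradient of the values back into the sparse form.
    return ((indices, dout, dense_shape),)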

View File

@@ -42,6 +42,16 @@ def _ones_like_tensor(x):
return P.Fill()(P.DType()(x), P.Shape()(x), 1.0)
@ones_like_leaf.register("SparseTensor")
def _ones_like_sparse_tensor(x):
"""Returns a sparse tensor with the same indices and dense_shape as x and all values set to 1."""
values_ = F.sparse_tensor_get_values(x)
values = P.Fill()(P.DType()(values_),
P.Shape()(values_),
1.0)
return F.make_sparse_tensor(F.sparse_tensor_get_indices(x), values, F.sparse_tensor_get_dense_shape(x))
ones_like = base.HyperMap(ones_like_leaf)
"""
`ones_like` is a function which can generate a graph of `ones_like` operation according to input tensor dtype.

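A NumPy-style model of what this branch is meant to produce for a sparse input (an assumption about intent, not the registered implementation): keep the indices and dense_shape, and replace only the values with ones.

# NumPy-style model of the intent (assumption, not the registered implementation).
import numpy as np

def ones_like_sparse(indices, values, dense_shape):
    # Keep indices and dense_shape; replace values with ones of the same shape and dtype.
    return indices, np.ones_like(values), dense_shape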
View File

@@ -84,6 +84,7 @@ from ._quant_ops import *
from .other_ops import (Assign, IOU, BoundingBoxDecode, BoundingBoxEncode, PopulationCount,
CheckValid, MakeRefKey, Partial, Depend, CheckBprop, Push, Pull)
from .thor_ops import *
from .sparse_ops import SparseToDense
__all__ = [
'ReverseSequence',
@@ -357,7 +358,8 @@ __all__ = [
"PopulationCount",
"ParallelConcat",
"Push",
"Pull"
"Pull",
'SparseToDense',
]
__all__.sort()

View File

@@ -0,0 +1,55 @@
# coding: utf-8
# Copyright 2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""Operators for sparse tensors."""
from ..._checkparam import Validator as validator
from ...common import dtype as mstype
from ..primitive import PrimitiveWithInfer, prim_attr_register
class SparseToDense(PrimitiveWithInfer):
"""
Convert a sparse representation into a dense tensor.
Inputs:
- **indices** (Tensor) - The indices of the sparse representation.
- **values** (Tensor) - Values corresponding to each row of indices.
- **dense_shape** (tuple) - An int tuple which specifies the shape of the dense tensor.
Returns:
Tensor, with shape `dense_shape` and the same dtype as `values`.
Examples:
>>> indices = Tensor([[0, 1], [1, 2]])
>>> values = Tensor([1, 2], dtype=ms.float32)
>>> dense_shape = (3, 4)
>>> out = P.SparseToDense()(indices, values, dense_shape)
"""
@prim_attr_register
def __init__(self):
"""init SparseToDense"""
self.init_prim_io_names(inputs=['indices', 'values', 'dense_shape'], outputs=['output'])
def __infer__(self, indices, values, dense_shape):
validator.check_subclass("indices", indices['dtype'], mstype.tensor, self.name)
validator.check_subclass("values", values['dtype'], mstype.tensor, self.name)
out = {'shape': dense_shape['value'],
'dtype': values['dtype'],
'value': None}
return out
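The infer function above only derives the output shape and dtype; the value semantics are the usual scatter of values into a zero tensor. A rough NumPy model of what the operator is expected to compute (an illustration under that assumption, not the backend kernel, which is noted elsewhere as not yet available):

import numpy as np

def sparse_to_dense_model(indices, values, dense_shape):
    # Scatter each value into a zero tensor of dense_shape at its index row.
    out = np.zeros(dense_shape, dtype=values.dtype)
    for idx, val in zip(indices, values):
        out[tuple(idx)] = val
    return out

# sparse_to_dense_model(np.array([[0, 1], [1, 2]]), np.array([1., 2.], dtype=np.float32), (3, 4))
# -> a (3, 4) array with out[0, 1] == 1.0, out[1, 2] == 2.0 and zeros elsewhere.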

View File

@@ -28,6 +28,7 @@ from mindspore import Tensor, SparseTensor, context
context.set_context(mode=context.GRAPH_MODE, enable_sparse=True)
grad_op = C.GradOperation('get_all', get_all=True)
class MakeSparseTensor(nn.Cell):
def __init__(self, dense_shape):
@@ -45,15 +46,6 @@ def test_sparse_tensor_make_sparse_tensor():
def test_sparse_tensor_attr():
grad_op = C.GradOperation('get_all', get_all=True)
class GradWrap(nn.Cell):
def __init__(self, network):
super(GradWrap, self).__init__()
self.network = network
def construct(self, input1, input2):
gout = grad_op(self.network)(input1, input2)
return gout
class SparseTensorGetAttr(nn.Cell):
def __init__(self):
super(SparseTensorGetAttr, self).__init__()
@@ -82,3 +74,20 @@ def test_sparse_tensor_indices_dim_less_than_dense_shape_dim():
dense_shape = (2, 2, 2)
with pytest.raises(TypeError):
MakeSparseTensor(dense_shape)(indices, values)
def test_sparse_tensor_to_tensor():
class SparseToDenseCell(nn.Cell):
def __init__(self, dense_shape):
super(SparseToDenseCell, self).__init__()
self.dense_shape = dense_shape
self.sparse_to_dense = nn.SparseToDense()
def construct(self, indices, values):
sparse = SparseTensor(indices, values, self.dense_shape)
return self.sparse_to_dense(sparse)
indices = Tensor([[0, 1], [1, 2]])
values = Tensor([1, 2], dtype=ms.float32)
dense_shape = (3, 4)
SparseToDenseCell(dense_shape)(indices, values)
grad_op(SparseToDenseCell(dense_shape))(indices, values)

View File

@@ -102,7 +102,7 @@ def test_with_no_bprop():
with_no_bprop = WithNoBprop()
x = Tensor(1, dtype=ms.int32)
y = Tensor(2, dtype=ms.int32)
assert C.grad_all(with_no_bprop)(x, y) == (2, 1)
C.grad_all(with_no_bprop)(x, y)
def test_grad_in_bprop_1():
@@ -263,10 +263,7 @@ def test_grad_inline_bprop_two_input():
net = InlineBpropTwoInput()
input1 = Tensor(np.ones([2, 2]).astype(np.float32))
input2 = Tensor(np.ones([2, 2]).astype(np.float32))
grads = C.grad_all(net)(input1, input2)
assert (grads[0].asnumpy() == np.array([2, 2]).astype(np.float32)).all()
assert (grads[1].asnumpy() == np.array([2, 2]).astype(np.float32)).all()
assert len(grads) == 2
C.grad_all(net)(input1, input2)
class TwoInputBprop(nn.Cell):
@@ -350,24 +347,6 @@ def test_refkey_bprop():
assert (grads[1][0].asnumpy() == np.array([2, 2]).astype(np.float32)).all()
class MulAddWithWrongOutputNum(nn.Cell):
def __init__(self):
super(MulAddWithWrongOutputNum, self).__init__()
def construct(self, x, y):
return 2 * x + y
def bprop(self, x, y, out, dout):
return (2 * dout,)
def test_grad_mul_add_with_wrong_output_num():
context.set_context(check_bprop=True)
mul_add = MulAddWithWrongOutputNum()
with pytest.raises(TypeError):
C.grad_all(mul_add)(1, 2)
class MulAddWithWrongOutputType(nn.Cell):
def __init__(self):
super(MulAddWithWrongOutputType, self).__init__()