!2021 GPU add akg kernel greaterequal notequal

Merge pull request !2021 from VectorSL/gpu-add-akg-kernel
2020-06-12 15:14:47 +08:00 · 2020-06-12 15:14:47 +08:00 · 87fa15de80
parent 259341b9ba cf2fc1cecf
commit 87fa15de80
10 changed files with 317 additions and 2 deletions
--- a/mindspore/_akg/gpu/init.py
+++ b/mindspore/_akg/gpu/init.py
@ -35,3 +35,5 @@ from .logical_not import LogicalNot, gpu_schedule_LogicalNot
 from .logical_and import LogicalAnd, gpu_schedule_LogicalAnd
 from .sub import Sub, gpu_schedule_Sub
 from .less_equal import LessEqual, gpu_schedule_LessEqual
 from .notequal import NotEqual, gpu_schedule_NotEqual
 from .greater_equal import GreaterEqual, gpu_schedule_GreaterEqual
--- a/mindspore/_akg/gpu/greater_equal.py
+++ b/mindspore/_akg/gpu/greater_equal.py
@ -0,0 +1,41 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """greater_equal"""
 import _akg.tvm
 from _akg.ops.math import greater_equal
 from _akg.topi.generic import schedule_elemwise
 def GreaterEqual(x, y):
    """GreaterEqual."""
    return greater_equal.greater_equal(x, y)
 def gpu_schedule_GreaterEqual(outs):
    """
    GPU schedule for GreaterEqual.
    Args:
        outs (tvm.tensor.Tensor): Outputs of compute.
    Returns:
        sch (schedule.Schedule): The created schedule.
    """
    device = 'cuda'
    ctx = _akg.tvm.context(device, 0)
    if not ctx.exist:
        raise SystemError("Skip because %s is not enabled" % device)
    with _akg.tvm.target.create(device):
        sch = schedule_elemwise(outs)
    return sch
--- a/mindspore/_akg/gpu/notequal.py
+++ b/mindspore/_akg/gpu/notequal.py
@ -0,0 +1,41 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """notequal"""
 import _akg.tvm
 from _akg.ops.math import notequal
 from _akg.topi.generic import schedule_elemwise
 def NotEqual(x, y):
    """notequal."""
    return notequal.notequal(x, y)
 def gpu_schedule_NotEqual(outs):
    """
    gpu schedule for NotEqual.
    Args:
        outs (tvm.tensor.Tensor): outputs of compute.
    Returns:
        sch (schedule.Schedule): The created schedule.
    """
    device = 'cuda'
    ctx = _akg.tvm.context(device, 0)
    if not ctx.exist:
        raise SystemError("Skip because %s is not enabled" % device)
    with _akg.tvm.target.create(device):
        sch = schedule_elemwise(outs)
    return sch
--- a/mindspore/_akg/ops/math/greater_equal.py
+++ b/mindspore/_akg/ops/math/greater_equal.py
@ -0,0 +1,54 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """operator dsl function: greaterequal"""
 import _akg.tvm
 import _akg.topi
 from _akg.utils.dsl_create import produce_shapes
 from _akg.utils import validation_check as vc_util
@vc_util.check_input_type(_akg.tvm.tensor.Tensor, _akg.tvm.tensor.Tensor)
 def greater_equal(input1, input2):
    """
    Check whether input1 greaterquals to input2.
    Args:
        input1 (tvm.tensor.Tensor): Tensor.
        input2 (tvm.tensor.Tensor): Tensor.
    Returns:
        tvm.tensor.Tensor. If input1 greaterquals to input2 return True, else return False.
    """
    shape1 = [x.value for x in input1.shape]
    shape2 = [x.value for x in input2.shape]
    vc_util.check_shape(shape1)
    vc_util.check_shape(shape2)
    shape1, shape2, shape = produce_shapes(shape1, shape2)
    vc_util.elemwise_dtype_check(input1.dtype, input2.dtype)
    dtype = input1.dtype
    # get greaterquals compute
    t_value = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.const(1, dtype), "T")
    f_value = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.const(0, dtype), "F")
    input1_bro = _akg.topi.broadcast_to(input1, shape)
    input2_bro = _akg.topi.broadcast_to(input2, shape)
    c_out = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.expr.Select(input1_bro[indice] >= input2_bro[indice],
                                                                         t_value[indice], f_value[indice]), name="C")
    res = _akg.tvm.compute(shape, lambda *indice: c_out(*indice).astype("bool"), name="res")
    return res
--- a/mindspore/_akg/ops/math/notequal.py
+++ b/mindspore/_akg/ops/math/notequal.py
@ -0,0 +1,54 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """operator dsl function: notequal"""
 import _akg.tvm
 import _akg.topi
 from _akg.utils.dsl_create import produce_shapes
 from _akg.utils import validation_check as vc_util
@vc_util.check_input_type(_akg.tvm.tensor.Tensor, _akg.tvm.tensor.Tensor)
 def notequal(input1, input2):
    """
    check whether input1 notequals to input2.
    Args:
        input1 (tvm.tensor.Tensor): Tensor.
        input2 (tvm.tensor.Tensor): Tensor.
    Returns:
        tvm.tensor.Tensor. If input1 notequal to input2 return True, else return False.
    """
    shape1 = [x.value for x in input1.shape]
    shape2 = [x.value for x in input2.shape]
    vc_util.check_shape(shape1)
    vc_util.check_shape(shape2)
    shape1, shape2, shape = produce_shapes(shape1, shape2)
    vc_util.elemwise_dtype_check(input1.dtype, input2.dtype)
    dtype = input1.dtype
    # get notequal compute
    t_value = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.const(1, dtype), "T")
    f_value = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.const(0, dtype), "F")
    input1_bro = _akg.topi.broadcast_to(input1, shape)
    input2_bro = _akg.topi.broadcast_to(input2, shape)
    c_out = _akg.tvm.compute(shape, lambda *indice: _akg.tvm.expr.Select(input1_bro[indice] != input2_bro[indice],
                                                                         t_value[indice], f_value[indice]), name="C")
    res = _akg.tvm.compute(shape, lambda *indice: c_out(*indice).astype("bool"), name="res")
    return res
--- a/mindspore/ops/_op_impl/akg/gpu/init.py
+++ b/mindspore/ops/_op_impl/akg/gpu/init.py
@ -32,3 +32,5 @@ from .logical_and import _logical_and_akg
 from .logical_not import _logical_not_akg
 from .logical_or import _logical_or_akg
 from .lessequal import _lessequal_akg
 from .notequal import _notequal_akg
 from .greater_equal import _greater_equal_akg
--- a/mindspore/ops/_op_impl/akg/gpu/greater_equal.py
+++ b/mindspore/ops/_op_impl/akg/gpu/greater_equal.py
@ -0,0 +1,32 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """GreaterEqual op"""
 from mindspore.ops.op_info_register import op_info_register, AkgRegOp, DataType
 greater_equal_op_info = AkgRegOp("GreaterEqual") \
    .fusion_type("OPAQUE") \
    .input(0, "x") \
    .input(1, "y") \
    .output(0, "output") \
    .dtype_format(DataType.F16_Default, DataType.F16_Default, DataType.BOOL_Default) \
    .dtype_format(DataType.F32_Default, DataType.F32_Default, DataType.BOOL_Default) \
    .dtype_format(DataType.I32_Default, DataType.I32_Default, DataType.BOOL_Default) \
    .get_op_info()
@op_info_register(greater_equal_op_info)
 def _greater_equal_akg():
    """GreaterEqual register"""
    return
--- a/mindspore/ops/_op_impl/akg/gpu/lessequal.py
+++ b/mindspore/ops/_op_impl/akg/gpu/lessequal.py
@ -15,7 +15,7 @@
 """LessEqual op"""
 from mindspore.ops.op_info_register import op_info_register, AkgRegOp, DataType
-equal_op_info = AkgRegOp("LessEqual") \
+lessequal_op_info = AkgRegOp("LessEqual") \
    .fusion_type("OPAQUE") \
    .input(0, "x") \
    .input(1, "y") \
@ -26,7 +26,7 @@ equal_op_info = AkgRegOp("LessEqual") \
    .get_op_info()
-@op_info_register(equal_op_info)
+@op_info_register(lessequal_op_info)
 def _lessequal_akg():
    """LessEqual register"""
    return
--- a/mindspore/ops/_op_impl/akg/gpu/notequal.py
+++ b/mindspore/ops/_op_impl/akg/gpu/notequal.py
@ -0,0 +1,32 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """NotEqual op"""
 from mindspore.ops.op_info_register import op_info_register, AkgRegOp, DataType
 notequal_op_info = AkgRegOp("NotEqual") \
    .fusion_type("OPAQUE") \
    .input(0, "x") \
    .input(1, "y") \
    .output(0, "output") \
    .dtype_format(DataType.F16_Default, DataType.F16_Default, DataType.BOOL_Default) \
    .dtype_format(DataType.F32_Default, DataType.F32_Default, DataType.BOOL_Default) \
    .dtype_format(DataType.I32_Default, DataType.I32_Default, DataType.BOOL_Default) \
    .get_op_info()
@op_info_register(notequal_op_info)
 def _notequal_akg():
    """NotEqual AutoDiff register"""
    return
--- a/tests/st/ops/gpu/test_equal_op.py
+++ b/tests/st/ops/gpu/test_equal_op.py
@ -30,6 +30,21 @@ class NetEqual(Cell):
    def construct(self, x, y):
        return self.Equal(x, y)
 class NetNotEqual(Cell):
    def __init__(self):
        super(NetNotEqual, self).__init__()
        self.NotEqual = P.NotEqual()
    def construct(self, x, y):
        return self.NotEqual(x, y)
 class NetGreaterEqual(Cell):
    def __init__(self):
        super(NetGreaterEqual, self).__init__()
        self.GreaterEqual = P.GreaterEqual()
    def construct(self, x, y):
        return self.GreaterEqual(x, y)
@pytest.mark.level0
@pytest.mark.platform_x86_gpu_training
@ -63,3 +78,45 @@ def test_equal():
    output1 = equal(x1, y1)
    assert np.all(output1.asnumpy() == expect1)
    assert output1.shape() == expect1.shape
@pytest.mark.level0
@pytest.mark.platform_x86_gpu_training
@pytest.mark.env_onecard
 def test_notequal():
    x0 = Tensor(np.array([[1.2, 1], [1, 0]]).astype(np.float32))
    y0 = Tensor(np.array([[1, 2]]).astype(np.float32))
    expect0 = np.array([[True, True], [False, True]])
    context.set_context(mode=context.PYNATIVE_MODE, device_target="GPU")
    notequal = NetNotEqual()
    output0 = notequal(x0, y0)
    assert np.all(output0.asnumpy() == expect0)
    assert output0.shape() == expect0.shape
    context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
    notequal = NetNotEqual()
    output0 = notequal(x0, y0)
    assert np.all(output0.asnumpy() == expect0)
    assert output0.shape() == expect0.shape
@pytest.mark.level0
@pytest.mark.platform_x86_gpu_training
@pytest.mark.env_onecard
 def test_greaterqual():
    x0 = Tensor(np.array([[1.2, 1], [1, 0]]).astype(np.float32))
    y0 = Tensor(np.array([[1, 2]]).astype(np.float32))
    expect0 = np.array([[True, False], [True, False]])
    context.set_context(mode=context.PYNATIVE_MODE, device_target="GPU")
    gequal = NetGreaterEqual()
    output0 = gequal(x0, y0)
    assert np.all(output0.asnumpy() == expect0)
    assert output0.shape() == expect0.shape
    context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
    gequal = NetGreaterEqual()
    output0 = gequal(x0, y0)
    assert np.all(output0.asnumpy() == expect0)
    assert output0.shape() == expect0.shape