!30679 [MD] Add tests for Python Multiprocessing with AutoTune

Merge pull request !30679 from cathwong/ckw_ut_map_python_multiproc
i-robot 2022-03-02 14:26:09 +00:00 committed by Gitee
commit 4aa82cc21e
3 changed files with 294 additions and 2 deletions


@@ -14,11 +14,15 @@
# ============================================================================
import os
import time
import pytest
import numpy as np
import mindspore.dataset as ds
import mindspore.dataset.transforms.c_transforms as C
import mindspore.dataset.transforms.py_transforms as py_transforms
import mindspore.dataset.vision.c_transforms as CV
import mindspore.dataset.vision.py_transforms as py_vision
from mindspore import context, nn
from mindspore.common import dtype as mstype, set_seed
@@ -30,6 +34,7 @@ def create_model():
"""
Define and return a simple model
"""
class Net(nn.Cell):
def construct(self, x, y):
return x
@@ -79,6 +84,7 @@ def create_dataset(data_path, batch_size=32, repeat_size=1, num_parallel_workers
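# Note: the forked marker (from the pytest-forked plugin) runs the test in a forked
# subprocess so that multiprocessing/AutoTune state does not leak across tests.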
@pytest.mark.level0
@pytest.mark.platform_x86_gpu_training
@pytest.mark.env_onecard
@pytest.mark.forked
def test_autotune_train_simple_model():
"""
Feature: Dataset AutoTune
@@ -86,11 +92,13 @@ def test_autotune_train_simple_model():
Expectation: Training completes successfully
"""
original_seed = ds.config.get_seed()
set_seed(1)
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
context.set_context(enable_graph_kernel=True)
# Enable Dataset AutoTune
original_autotune = ds.config.get_enable_autotune()
ds.config.set_enable_autotune(True)
ds_train = create_dataset(os.path.join("/home/workspace/mindspore_dataset/mnist", "train"), 32, 1)
@@ -101,5 +109,84 @@ def test_autotune_train_simple_model():
model.train(epoch_size, ds_train)
print("Training is finished.")
# Disable Dataset AutoTune
ds.config.set_enable_autotune(False)
# Restore settings
ds.config.set_enable_autotune(original_autotune)
ds.config.set_seed(original_seed)
def create_dataset_pyfunc_multiproc(data_path, batch_size=32, num_map_parallel_workers=1, max_rowsize=16):
"""
Create dataset with a Python ops list and python_multiprocessing=True for the Map ops
"""
# Define dataset
data1 = ds.MnistDataset(data_path, num_parallel_workers=8)
data1 = data1.map(operations=[py_vision.ToType(np.int32)], input_columns="label",
num_parallel_workers=num_map_parallel_workers,
python_multiprocessing=True, max_rowsize=max_rowsize)
# Set up transforms list which includes Python ops
transforms_list = [
py_vision.ToTensor(),
lambda x: x,
py_vision.HWC2CHW(),
py_vision.RandomErasing(0.9, value='random'),
py_vision.Cutout(4, 2),
lambda y: y
]
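# (the identity lambdas above exercise arbitrary user-defined Pyfuncs in the same Map op)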
compose_op = py_transforms.Compose(transforms_list)
data1 = data1.map(operations=compose_op, input_columns="image", num_parallel_workers=num_map_parallel_workers,
python_multiprocessing=True, max_rowsize=max_rowsize)
# Apply Dataset Ops
data1 = data1.batch(batch_size, drop_remainder=True)
return data1
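# Illustrative usage sketch (not executed by the tests; shown for reference only):
#   data = create_dataset_pyfunc_multiproc("/home/workspace/mindspore_dataset/mnist/train")
#   for row in data.create_dict_iterator(num_epochs=1, output_numpy=True):
#       print(row["image"].shape, row["label"].shape)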
@pytest.mark.level0
@pytest.mark.platform_x86_gpu_training
@pytest.mark.env_onecard
@pytest.mark.forked
def test_autotune_pymultiproc_train_simple_model():
"""
Feature: Dataset AutoTune
Description: Test Dataset AutoTune with Python Multiprocessing for Training of a Simple Model
Expectation: Training completes successfully
"""
original_seed = ds.config.get_seed()
set_seed(20)
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
context.set_context(enable_graph_kernel=True)
# Reduce memory required by disabling the shared memory optimization
mem_original = ds.config.get_enable_shared_mem()
ds.config.set_enable_shared_mem(False)
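# (with shared memory disabled, row data is presumably passed back from the worker
# processes via queues instead of shared-memory blocks)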
# Enable Dataset AutoTune
original_autotune = ds.config.get_enable_autotune()
ds.config.set_enable_autotune(True)
original_interval = ds.config.get_autotune_interval()
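# Adjust the pipeline configuration every 100 steps (the AutoTune interval is measured in steps)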
ds.config.set_autotune_interval(100)
ds_train = create_dataset_pyfunc_multiproc(os.path.join("/home/workspace/mindspore_dataset/mnist", "train"), 32, 2)
model = create_model()
print("Start Model Training.")
model_start = time.time()
epoch_size = 2
model.train(epoch_size, ds_train)
print("Model training is finished. Took {}s".format(time.time() - model_start))
# Restore settings
ds.config.set_autotune_interval(original_interval)
ds.config.set_enable_autotune(original_autotune)
ds.config.set_enable_shared_mem(mem_original)
ds.config.set_seed(original_seed)
if __name__ == "__main__":
test_autotune_train_simple_model()
test_autotune_pymultiproc_train_simple_model()


@@ -16,6 +16,7 @@
Testing Autotune support in DE for MindDataset
"""
import os
import pytest
import mindspore.dataset as ds
import mindspore.dataset.vision.c_transforms as vision
from mindspore.dataset.vision import Inter
@@ -23,6 +24,7 @@ from util_minddataset import add_and_remove_cv_file
# pylint: disable=unused-variable, redefined-outer-name
@pytest.mark.forked
def test_autotune_simple_pipeline_mindrecord(add_and_remove_cv_file):
"""
Feature: Autotuning


@@ -0,0 +1,203 @@
# Copyright 2022 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""
Test Python Multiprocessing with AutoTuning
"""
import numpy as np
import pytest
import mindspore.dataset as ds
import mindspore.dataset.transforms.c_transforms as c_transforms
import mindspore.dataset.transforms.py_transforms as py_transforms
import mindspore.dataset.vision.c_transforms as c_vision
import mindspore.dataset.vision.py_transforms as py_vision
from mindspore.dataset.vision import Inter
DATA_DIR = "../data/dataset/testCifar10Data"
def create_pyfunc_dataset(batch_size=32, repeat_size=1, num_parallel_workers=1, num_samples=None):
"""
Create Cifar10 dataset pipeline with Map ops containing only Python functions and Python Multiprocessing enabled
"""
# Define dataset
cifar10_ds = ds.Cifar10Dataset(DATA_DIR, num_samples=num_samples)
cifar10_ds = cifar10_ds.map(operations=[py_vision.ToType(np.int32)], input_columns="label",
num_parallel_workers=num_parallel_workers, python_multiprocessing=True)
# Set up transforms list which includes Python ops / Pyfuncs
transforms_list = [
py_vision.ToPIL(),
py_vision.RandomGrayscale(prob=0.2),
np.array] # need to convert PIL image to a NumPy array to pass it to C++ operations
compose_op = py_transforms.Compose(transforms_list)
cifar10_ds = cifar10_ds.map(operations=compose_op, input_columns="image",
num_parallel_workers=num_parallel_workers,
python_multiprocessing=True)
# Apply Dataset Ops
buffer_size = 10000
cifar10_ds = cifar10_ds.shuffle(buffer_size=buffer_size)
cifar10_ds = cifar10_ds.batch(batch_size, drop_remainder=True)
cifar10_ds = cifar10_ds.repeat(repeat_size)
return cifar10_ds
def create_pyop_cop_dataset(batch_size=32, repeat_size=1, num_parallel_workers=1, num_samples=None):
"""
Create Cifar10 dataset pipeline with Map ops containing just C Ops or just Pyfuncs
"""
# Define dataset
cifar10_ds = ds.Cifar10Dataset(DATA_DIR, num_samples=num_samples)
# Map#1 - with Pyfunc
cifar10_ds = cifar10_ds.map(operations=[py_vision.ToType(np.int32)], input_columns="label",
num_parallel_workers=num_parallel_workers, python_multiprocessing=True)
# Map#2 - with C Ops
resize_height, resize_width = 32, 32
rescale = 1.0 / 255.0
shift = 0.0
rescale_nml = 1 / 0.3081
shift_nml = -1 * 0.1307 / 0.3081
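# Rescale(1 / 0.3081, -0.1307 / 0.3081) applies the normalization (x - 0.1307) / 0.3081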
resize_op = c_vision.Resize((resize_height, resize_width), interpolation=Inter.LINEAR)
rescale_op = c_vision.Rescale(rescale, shift)
rescale_nml_op = c_vision.Rescale(rescale_nml, shift_nml)
hwc2chw_op = c_vision.HWC2CHW()
transforms = [resize_op, rescale_op, rescale_nml_op, hwc2chw_op]
compose_op = c_transforms.Compose(transforms)
cifar10_ds = cifar10_ds.map(operations=compose_op, input_columns="image",
num_parallel_workers=num_parallel_workers,
python_multiprocessing=True)
# Map#3 - with Pyfunc
transforms_list = [lambda x: x]
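# (identity Pyfunc keeps Map#3 as a purely Python-executed op)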
compose_op = py_transforms.Compose(transforms_list)
cifar10_ds = cifar10_ds.map(operations=compose_op, input_columns="image",
num_parallel_workers=num_parallel_workers,
python_multiprocessing=True)
# Apply Dataset Ops
buffer_size = 10000
cifar10_ds = cifar10_ds.shuffle(buffer_size=buffer_size)
cifar10_ds = cifar10_ds.batch(batch_size, drop_remainder=True)
cifar10_ds = cifar10_ds.repeat(repeat_size)
return cifar10_ds
def create_mixed_map_dataset(batch_size=32, repeat_size=1, num_parallel_workers=1, num_samples=None):
"""
Create Cifar10 dataset pipeline with a Map op containing both C Ops and Pyfuncs
"""
# Define dataset
cifar10_ds = ds.Cifar10Dataset(DATA_DIR, num_samples=num_samples)
cifar10_ds = cifar10_ds.map(operations=[py_vision.ToType(np.int32)], input_columns="label",
num_parallel_workers=num_parallel_workers, python_multiprocessing=True)
# Map with operations: Pyfunc + C Ops + Pyfunc
resize_op = c_vision.Resize((32, 32), interpolation=Inter.LINEAR)
rescale_op = c_vision.Rescale(1.0 / 255.0, 0.0)
rescale_nml_op = c_vision.Rescale(1 / 0.3081, -1 * 0.1307 / 0.3081)
hwc2chw_op = c_vision.HWC2CHW()
cifar10_ds = cifar10_ds.map(
operations=[lambda x: x, resize_op, rescale_op, rescale_nml_op, hwc2chw_op, lambda y: y],
input_columns="image", num_parallel_workers=num_parallel_workers,
python_multiprocessing=True)
# Apply Dataset Ops
buffer_size = 10000
cifar10_ds = cifar10_ds.shuffle(buffer_size=buffer_size)
cifar10_ds = cifar10_ds.batch(batch_size, drop_remainder=True)
cifar10_ds = cifar10_ds.repeat(repeat_size)
return cifar10_ds
@pytest.mark.forked
class TestPythonMultiprocAutotune:
def setup_method(self):
"""
Run before each test function.
"""
# Reduce memory required by disabling the shared memory optimization
self.mem_original = ds.config.get_enable_shared_mem()
ds.config.set_enable_shared_mem(False)
def teardown_method(self):
"""
Run after each test function.
"""
ds.config.set_enable_shared_mem(self.mem_original)
@staticmethod
def test_cifar10_pyfunc_pipeline():
"""
Feature: Python Multiprocessing with AutoTune
Description: Test pipeline with Map ops containing only Python functions
Expectation: Data pipeline executes successfully with correct number of rows
"""
# Note: Set num_parallel_workers to the minimum value of 1
mydata1 = create_pyfunc_dataset(32, 1, num_parallel_workers=1, num_samples=400)
mycount1 = 0
for _ in mydata1.create_dict_iterator(num_epochs=1):
mycount1 += 1
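# floor(400 samples / batch_size 32) = 12 batches with drop_remainder=True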
assert mycount1 == 12
@staticmethod
def test_cifar10_pyfunc_pipeline_all_samples():
"""
Feature: Python Multiprocessing with AutoTune
Description: Test pipeline with Map ops containing only Python functions, using all samples in the dataset
Expectation: Data pipeline executes successfully with correct number of rows
"""
# Note: Use all samples
mydata1 = create_pyfunc_dataset(32, 1, num_parallel_workers=8)
mycount1 = 0
for _ in mydata1.create_dict_iterator(num_epochs=1):
mycount1 += 1
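# with drop_remainder=True, the full test dataset yields 312 complete batches of 32 rows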
assert mycount1 == 312
@staticmethod
def test_cifar10_pyop_cop_pipeline():
"""
Feature: Python Multiprocessing with AutoTune
Description: Test pipeline with Map ops containing just C Ops or just Pyfuncs
Expectation: Data pipeline executes successfully with correct number of rows
"""
mydata1 = create_pyop_cop_dataset(16, 1, num_parallel_workers=4, num_samples=600)
mycount1 = 0
for _ in mydata1.create_dict_iterator(num_epochs=1):
mycount1 += 1
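# floor(600 samples / batch_size 16) = 37 batches with drop_remainder=True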
assert mycount1 == 37
@staticmethod
def test_cifar10_mixed_map_pipeline():
"""
Feature: Python Multiprocessing with AutoTune
Description: Test pipeline with a Map op containing both C Ops and Pyfuncs
Expectation: Data pipeline executes successfully with correct number of rows
"""
mydata1 = create_mixed_map_dataset(32, 2, num_parallel_workers=12, num_samples=500)
mycount1 = 0
for _ in mydata1.create_dict_iterator(num_epochs=1):
mycount1 += 1
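# floor(500 samples / batch_size 32) = 15 batches per epoch, repeated 2 times -> 30 batches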
assert mycount1 == 30