!9071 add testcase for ps

From: @chopin_syp Reviewed-by: @cristoval,@limingqi107 Signed-off-by: @limingqi107
5 years ago · 32aa790f43
parent ebef1df00b c191deff1d
commit 32aa790f43
3 changed files with 265 additions and 0 deletions
--- a/tests/st/ps/part_ps/shell_run_test.sh
+++ b/tests/st/ps/part_ps/shell_run_test.sh
@ -0,0 +1,56 @@
 #!/bin/bash
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ============================================================================
 execute_path=$(pwd)
 self_path=$(dirname "${script_self}")
 export MS_COMM_TYPE=zmq
 export MS_SCHED_NUM=1
 DEVICE_TARGET=$1
 DATASET_PATH=$2
 export MS_WORKER_NUM=$3
 export MS_SERVER_NUM=$4
 export MS_SCHED_HOST=$5
 export MS_SCHED_PORT=$6
 export MS_ROLE=MS_SCHED
 for((i=0;i<1;i++));
 do
  rm -rf ${execute_path}/sched_$i/
  mkdir ${execute_path}/sched_$i/
  cd ${execute_path}/sched_$i/ || exit
  python ${self_path}/../test_ps_embedding_heterogeneous_conv2d_adam.py --device_target=$DEVICE_TARGET --dataset_path=$DATASET_PATH &
 done
 export MS_ROLE=MS_PSERVER
 for((i=0;i<$MS_SERVER_NUM;i++));
 do
  rm -rf ${execute_path}/server_$i/
  mkdir ${execute_path}/server_$i/
  cd ${execute_path}/server_$i/ || exit
  python ${self_path}/../test_ps_embedding_heterogeneous_conv2d_adam.py --device_target=$DEVICE_TARGET --dataset_path=$DATASET_PATH &
 done
 export MS_ROLE=MS_WORKER
 for((i=0;i<$MS_WORKER_NUM;i++));
 do
  rm -rf ${execute_path}/worker_$i/
  mkdir ${execute_path}/worker_$i/
  cd ${execute_path}/worker_$i/ || exit
  python ${self_path}/../test_ps_embedding_heterogeneous_conv2d_adam.py --device_target=$DEVICE_TARGET --dataset_path=$DATASET_PATH &
 done
 wait $!
 exit $?
--- a/tests/st/ps/part_ps/test_entry_ps_embedding_heterogeneous_conv2d_adam.py
+++ b/tests/st/ps/part_ps/test_entry_ps_embedding_heterogeneous_conv2d_adam.py
@ -0,0 +1,27 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ============================================================================
 import os
 import pytest
@pytest.mark.level0
@pytest.mark.platform_arm_ascend_training
@pytest.mark.platform_x86_ascend_training
@pytest.mark.env_onecard
 def test_ps_embedding_heterogeneous_conv2d_adam():
    return_code = os.system(
        "bash shell_run_test.sh Ascend /home/workspace/mindspore_dataset/mnist 1 1 127.0.0.1 8085"
    )
    assert return_code == 0
--- a/tests/st/ps/part_ps/test_ps_embedding_heterogeneous_conv2d_adam.py
+++ b/tests/st/ps/part_ps/test_ps_embedding_heterogeneous_conv2d_adam.py
@ -0,0 +1,182 @@
 # Copyright 2020 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 # http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ============================================================================
 import os
 import argparse
 import numpy as np
 import mindspore.context as context
 import mindspore.dataset as ds
 import mindspore.dataset.transforms.c_transforms as C
 import mindspore.dataset.vision.c_transforms as CV
 from mindspore.common import dtype as mstype
 from mindspore.dataset.vision import Inter
 from mindspore.common.tensor import Tensor
 from mindspore.nn import Cell
 from mindspore.nn import Flatten
 from mindspore.nn import Conv2d
 from mindspore.nn import BatchNorm2d
 from mindspore.nn import SoftmaxCrossEntropyWithLogits
 from mindspore.nn import Adam
 from mindspore.nn import EmbeddingLookup
 from mindspore.nn import ReLU
 import mindspore
 import mindspore.ops.operations as op
 from mindspore.common.parameter import Parameter
 from mindspore.train import Model
 from mindspore.common import set_seed
 parser = argparse.ArgumentParser(description='test_ps_lenet')
 parser.add_argument("--device_target", type=str, default="Ascend")
 parser.add_argument("--dataset_path", type=str, default="/home/workspace/mindspore_dataset/mnist")
 args, _ = parser.parse_known_args()
 device_target = args.device_target
 dataset_path = args.dataset_path
 context.set_context(mode=context.GRAPH_MODE, device_target=device_target, enable_sparse=True)
 context.set_ps_context(enable_ps=True)
 class Menet(Cell):
    def __init__(self, in_channels, out_channels, kernel_size, vocab_size, embedding_size,
                 output_channels, target, sparse):
        super().__init__()
        set_seed(5)
        self.relu = ReLU()
        self.conv = Conv2d(in_channels=in_channels, out_channels=out_channels,
                           kernel_size=kernel_size, has_bias=True, weight_init='normal')
        self.batchnorm = BatchNorm2d(num_features=out_channels)
        self.embedding_lookup = EmbeddingLookup(vocab_size=vocab_size,
                                                embedding_size=embedding_size,
                                                param_init='normal', target=target, sparse=sparse)
        self.flatten = Flatten()
        self.cast = op.Cast()
        self.bias = Parameter(Tensor(np.ones([output_channels]).astype(np.float32)), name='bias')
        self.biasadd = op.BiasAdd()
        self.type = mindspore.int32
    def construct(self, x):
        x = self.conv(x)
        x = self.batchnorm(x)
        x = self.flatten(x)
        x = self.relu(x)
        x = self.cast(x, self.type)
        x = self.embedding_lookup(x)
        x = self.flatten(x)
        x = self.biasadd(x, self.bias)
        x = self.biasadd(x, self.bias)
        return x
 def create_dataset(data_path, batch_size=32, repeat_size=1,
                   num_parallel_workers=1):
    """
    create dataset for train or test
    """
    # define dataset
    mnist_ds = ds.MnistDataset(data_path)
    resize_height, resize_width = 32, 32
    rescale = 1.0 / 255.0
    shift = 0.0
    rescale_nml = 1 / 0.3081
    shift_nml = -1 * 0.1307 / 0.3081
    # define map operations
    resize_op = CV.Resize((resize_height, resize_width),
                          interpolation=Inter.LINEAR)  # Bilinear mode
    rescale_nml_op = CV.Rescale(rescale_nml, shift_nml)
    rescale_op = CV.Rescale(rescale, shift)
    hwc2chw_op = CV.HWC2CHW()
    type_cast_op = C.TypeCast(mstype.int32)
    # apply map operations on images
    mnist_ds = mnist_ds.map(operations=type_cast_op, input_columns="label",
                            num_parallel_workers=num_parallel_workers)
    mnist_ds = mnist_ds.map(operations=resize_op, input_columns="image",
                            num_parallel_workers=num_parallel_workers)
    mnist_ds = mnist_ds.map(operations=rescale_op, input_columns="image",
                            num_parallel_workers=num_parallel_workers)
    mnist_ds = mnist_ds.map(operations=rescale_nml_op, input_columns="image",
                            num_parallel_workers=num_parallel_workers)
    mnist_ds = mnist_ds.map(operations=hwc2chw_op, input_columns="image",
                            num_parallel_workers=num_parallel_workers)
    # apply DatasetOps
    buffer_size = 10000
    mnist_ds = mnist_ds.shuffle(buffer_size=buffer_size)  # 10000 as in LeNet train script
    mnist_ds = mnist_ds.batch(batch_size, drop_remainder=True)
    mnist_ds = mnist_ds.repeat(repeat_size)
    return mnist_ds
 class NetFactory:
    def __init__(self, dataset, input_shape=(2, 1, 32, 32), in_channels=1, out_channels=3,
                 kernel_size=5, vocab_size=5, embedding_size=1, output_channels=3072,
                 epoch_size=1, target='CPU', sparse=True):
        self.in_channels = in_channels
        self.out_channels = out_channels
        self.kernel_size = kernel_size
        self.vocab_size = vocab_size
        self.embedding_size = embedding_size
        self.output_channels = output_channels
        self.dataset = dataset
        self.epoch_size = epoch_size
        self.target = target
        self.sparse = sparse
        self.input_np = np.random.randn(*input_shape).astype(np.float32)
    def no_ps_impl(self):
        context.set_ps_context(enable_ps=False)
        net = Menet(self.in_channels, self.out_channels, self.kernel_size, self.vocab_size,
                    self.embedding_size, self.output_channels, self.target, self.sparse)
        net.conv.conv2d.add_prim_attr('primitive_target', 'CPU')
        net.conv.bias_add.add_prim_attr('primitive_target', 'CPU')
        net.set_train()
        loss = SoftmaxCrossEntropyWithLogits(sparse=True, reduction='mean')
        opt = Adam(params=filter(lambda x: x.requires_grad, net.get_parameters()))
        opt.target = 'CPU'
        model = Model(net, loss, opt)
        model.train(self.epoch_size, self.dataset, dataset_sink_mode=False)
        input_me = Tensor(self.input_np)
        out_me = model.predict(input_me)
        context.set_ps_context(enable_ps=True)
        return out_me.asnumpy()
    def part_ps_impl(self):
        net = Menet(self.in_channels, self.out_channels, self.kernel_size, self.vocab_size,
                    self.embedding_size, self.output_channels, self.target, self.sparse)
        net.embedding_lookup.set_param_ps()
        net.conv.conv2d.add_prim_attr('primitive_target', 'CPU')
        net.conv.bias_add.add_prim_attr('primitive_target', 'CPU')
        net.set_train()
        loss = SoftmaxCrossEntropyWithLogits(sparse=True, reduction='mean')
        opt = Adam(params=filter(lambda x: x.requires_grad, net.get_parameters()))
        opt.target = 'CPU'
        model = Model(net, loss, opt)
        model.train(self.epoch_size, self.dataset, dataset_sink_mode=False)
        input_me = Tensor(self.input_np)
        out_me = model.predict(input_me)
        return out_me.asnumpy()
    def part_cmp(self):
        part_ps = self.part_ps_impl()
        no_ps = self.no_ps_impl()
        assert np.allclose(no_ps, part_ps, rtol=1.0e-5, atol=1.0e-5)
 if __name__ == "__main__":
    datasets = create_dataset(os.path.join(dataset_path, "train"), 32, 1)
    fact = NetFactory(dataset=datasets)
    fact.part_cmp()