test=develop, add distributed_infer (#30300)
* test=develop, add distributed_infer
revert-31562-mean
parent
96784ed6c8
commit
2a98e9323a
@ -0,0 +1,108 @@
|
||||
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
from __future__ import print_function
|
||||
|
||||
import os
|
||||
import shutil
|
||||
import unittest
|
||||
import tempfile
|
||||
import tarfile
|
||||
from test_dist_fleet_base import TestFleetBase
|
||||
from paddle.dataset.common import download, DATA_HOME
|
||||
|
||||
|
||||
class TestDistCtrInfer(TestFleetBase):
    """Distributed CTR test that runs against downloaded, pre-saved parameters.

    ``_setup_config`` downloads ``ctr_saved_params.tar.gz``, unpacks it into a
    fresh temporary directory and stores that directory in
    ``self._model_dir``. The test method removes the directory again once the
    cluster run has finished, whether it succeeded or not.
    """

    def _setup_config(self):
        """Set the run configuration and unpack the saved CTR parameters."""
        self._mode = "async"
        self._reader = "pyreader"
        self._need_test = 1

        data_url = "https://fleet.bj.bcebos.com/unittest/ctr_saved_params.tar.gz"
        data_md5 = "aa7e8286ced566ea8a67410be7482438"
        module_name = "ctr_saved_params"
        path = download(data_url, module_name, data_md5)
        print('ctr_params is downloaded at ' + path)

        unzip_folder = tempfile.mkdtemp()
        try:
            # The context manager closes the archive handle even when
            # extraction fails.
            # NOTE(review): extractall() trusts member paths inside the
            # archive; this relies on the md5 passed to download() above to
            # pin the archive contents -- confirm download() enforces it.
            with tarfile.open(path) as tar:
                tar.extractall(unzip_folder)
        except Exception:
            # Do not leave a half-populated temp directory behind.
            shutil.rmtree(unzip_folder, ignore_errors=True)
            raise
        self._model_dir = unzip_folder

    def check_with_place(self,
                         model_file,
                         delta=1e-3,
                         check_error_log=False,
                         need_envs=None):
        """Build the environment for the run and hand it to ``_run_cluster``.

        Args:
            model_file: Script name forwarded to ``self._run_cluster``.
            delta: Accepted for interface compatibility; not used here.
            check_error_log: When true, verbose glog output is enabled via
                ``GLOG_v=3`` and ``GLOG_logtostderr=1``.
            need_envs: Optional extra environment variables; they override
                the defaults assembled below. ``None`` means no extras.
        """
        required_envs = {
            "PATH": os.getenv("PATH", ""),
            "PYTHONPATH": os.getenv("PYTHONPATH", ""),
            "LD_LIBRARY_PATH": os.getenv("LD_LIBRARY_PATH", ""),
            # NOTE(review): the original comment read "5sec to fail fast",
            # which does not match 30000; presumably the unit is
            # milliseconds (30 s) -- confirm against the flag definition.
            "FLAGS_rpc_deadline": "30000",
            "http_proxy": "",
            "FLAGS_communicator_send_queue_size": "2",
            "FLAGS_communicator_max_merge_var_num": "2",
            "CPU_NUM": "2",
        }

        if need_envs is not None:
            required_envs.update(need_envs)

        if check_error_log:
            required_envs["GLOG_v"] = "3"
            required_envs["GLOG_logtostderr"] = "1"

        # The two results are not inspected; the unpacking is kept so that an
        # unexpected return shape from _run_cluster still surfaces as an error.
        tr0_losses, tr1_losses = self._run_cluster(model_file, required_envs)

    def test_dist_infer(self):
        """Run ``dist_fleet_ctr.py`` and always clean up the unpacked params."""
        try:
            self.check_with_place(
                "dist_fleet_ctr.py", delta=1e-5, check_error_log=False)
        finally:
            # Remove the temp directory even when the cluster run raises.
            shutil.rmtree(self._model_dir)
|
||||
|
||||
|
||||
class TestDistCtrTrainInfer(TestFleetBase):
    """Distributed CTR test in async mode with ``_need_test`` enabled.

    No saved parameters are downloaded here and ``_model_dir`` is not set by
    this class.
    """

    def _setup_config(self):
        """Set the run configuration read by the base test class."""
        self._mode = "async"
        self._reader = "pyreader"
        self._need_test = 1

    def check_with_place(self,
                         model_file,
                         delta=1e-3,
                         check_error_log=False,
                         need_envs=None):
        """Build the environment for the run and hand it to ``_run_cluster``.

        Args:
            model_file: Script name forwarded to ``self._run_cluster``.
            delta: Accepted for interface compatibility; not used here.
            check_error_log: When true, verbose glog output is enabled via
                ``GLOG_v=3`` and ``GLOG_logtostderr=1``.
            need_envs: Optional extra environment variables; they override
                the defaults assembled below. ``None`` means no extras.
        """
        required_envs = {
            "PATH": os.getenv("PATH", ""),
            "PYTHONPATH": os.getenv("PYTHONPATH", ""),
            "LD_LIBRARY_PATH": os.getenv("LD_LIBRARY_PATH", ""),
            # NOTE(review): the original comment read "5sec to fail fast",
            # which does not match 30000; presumably the unit is
            # milliseconds (30 s) -- confirm against the flag definition.
            "FLAGS_rpc_deadline": "30000",
            "http_proxy": "",
            "FLAGS_communicator_send_queue_size": "2",
            "FLAGS_communicator_max_merge_var_num": "2",
            "CPU_NUM": "2",
        }

        if need_envs is not None:
            required_envs.update(need_envs)

        if check_error_log:
            required_envs["GLOG_v"] = "3"
            required_envs["GLOG_logtostderr"] = "1"

        # The two results are not inspected; the unpacking is kept so that an
        # unexpected return shape from _run_cluster still surfaces as an error.
        tr0_losses, tr1_losses = self._run_cluster(model_file, required_envs)

    def test_dist_train_infer(self):
        """Run ``dist_fleet_ctr.py`` through ``check_with_place``."""
        self.check_with_place(
            "dist_fleet_ctr.py", delta=1e-5, check_error_log=False)
|
||||
|
||||
|
||||
# Script entry point: hand control to unittest's command-line runner, but only
# when this file is executed directly rather than imported.
if __name__ == "__main__":
    unittest.main()
|
Loading…
Reference in new issue