!2697 format device ascend code

Merge pull request !2697 from kisnwang/format-device-ascend-code
5 years ago · 7951b318d0
parent 2291213b8b 89c9f46a97
commit 7951b318d0
6 changed files with 122 additions and 102 deletions
--- a/mindspore/ccsrc/device/ascend/ascend_kernel_runtime.cc
+++ b/mindspore/ccsrc/device/ascend/ascend_kernel_runtime.cc
@ -68,9 +68,9 @@ std::string GetRankId() {
        int rank_offset = std::stoi(offset);
        rank_id += rank_offset;
      } catch (std::invalid_argument) {
-        MS_LOG(EXCEPTION) << "stoi invalid argument:" << offset;
+        MS_LOG(EXCEPTION) << "Call stoi invalid argument:" << offset;
      } catch (std::out_of_range) {
-        MS_LOG(EXCEPTION) << "stoi out_of_range:" << offset;
+        MS_LOG(EXCEPTION) << "Call stoi out_of_range:" << offset;
      }
    }
    rank_id_str = std::to_string(rank_id);
@ -81,7 +81,7 @@ std::string GetRankId() {
  rank_id_str = std::getenv("RANK_ID");
 #endif
  if (rank_id_str.empty()) {
-    MS_LOG(ERROR) << "get hccl rankid failed, please set env RANK_ID";
+    MS_LOG(ERROR) << "Get hccl rankid failed, please set env RANK_ID";
  }
  return rank_id_str;
 }
@ -100,7 +100,7 @@ void AscendKernelRuntime::ClearGraphModelMap() {
 }

 void AscendKernelRuntime::ClearGraphRuntimeResource(uint32_t graph_id) {
-  MS_LOG(DEBUG) << "clear graph:" << graph_id << " runtime resource";
+  MS_LOG(DEBUG) << "Clear graph:" << graph_id << " runtime resource";
  auto iter = graph_model_map_.find(graph_id);
  if (iter == graph_model_map_.end()) {
    MS_LOG(DEBUG) << "GraphId:" << graph_id << " not found";
@ -118,7 +118,7 @@ bool AscendKernelRuntime::NeedDestroyHccl() {
  auto context_ptr = MsContext::GetInstance();
  MS_EXCEPTION_IF_NULL(context_ptr);
  if (!context_ptr->enable_hccl()) {
-    MS_LOG(INFO) << "hccl is not enabled";
+    MS_LOG(INFO) << "Hccl is not enabled";
    return false;
  }
  // Note: make sure hcom_connectivity_detection api never be used.
@ -126,7 +126,7 @@ bool AscendKernelRuntime::NeedDestroyHccl() {
 }

 void AscendKernelRuntime::ReleaseDeviceRes() {
-  MS_LOG(INFO) << "ascend finalize start";
+  MS_LOG(INFO) << "Ascend finalize start";
  // release ge runtime
  ClearGraphModelMap();

@ -134,7 +134,7 @@ void AscendKernelRuntime::ReleaseDeviceRes() {
  MS_EXCEPTION_IF_NULL(context_ptr);
  auto ret = rtSetDevice(context_ptr->device_id());
  if (ret != RT_ERROR_NONE) {
-    MS_EXCEPTION(DeviceProcessError) << "rtSetDevice, ret[" << static_cast<int>(ret) << "]";
+    MS_EXCEPTION(DeviceProcessError) << "Call rtSetDevice, ret[" << static_cast<int>(ret) << "]";
  }

  if (mem_manager_ != nullptr) {
@ -144,7 +144,7 @@ void AscendKernelRuntime::ReleaseDeviceRes() {
  (void)DestroyHccl();
  (void)ResetDevice();
  (void)ProfilingManager::GetInstance().StopProfiling();
-  MS_LOG(INFO) << "ascend finalize end";
+  MS_LOG(INFO) << "Ascend finalize end";
 }

 bool AscendKernelRuntime::Init() {
@ -155,7 +155,7 @@ bool AscendKernelRuntime::Init() {
 #ifdef ENABLE_DUMP_E2E
  ret = SetDumpConf();
  if (!ret) {
-    MS_LOG(INFO) << "no dump conf to set!";
+    MS_LOG(INFO) << "No dump conf to set!";
  }
 #endif

@ -263,13 +263,13 @@ void DumpParameters(mindspore::session::KernelGraph *graph, const string &dump_p
 bool AscendKernelRuntime::DumpData(mindspore::session::KernelGraph *graph) {
  MS_EXCEPTION_IF_NULL(graph);
 #ifdef ENABLE_DUMP_E2E
-  MS_LOG(INFO) << "start dump step";
+  MS_LOG(INFO) << "Start dump step";
  DumpConfPtr dump_conf = GetDumpConf();
  MS_EXCEPTION_IF_NULL(dump_conf);
  dump_conf->UpdataCurIter();
  bool dump_flag = dump_conf->dump_enable();
  if (!dump_flag) {
-    MS_LOG(INFO) << "dump flag is disable, pass dump step";
+    MS_LOG(INFO) << "Dump flag is disable, pass dump step";
    return true;
  }
  uint32_t cur_iter = dump_conf->cur_iter();
@ -278,7 +278,7 @@ bool AscendKernelRuntime::DumpData(mindspore::session::KernelGraph *graph) {
      return true;
    }
  }
-  MS_LOG(INFO) << "cur iter is " << cur_iter;
+  MS_LOG(INFO) << "Cur iter is " << cur_iter;
  std::string net_name = dump_conf->dump_net_name();
  std::string iterator = to_string(cur_iter);
  std::string dump_path = dump_conf->dump_path();
@ -369,9 +369,9 @@ void LoadParameters(mindspore::session::KernelGraph *graph, Debugger *debugger)
 bool AscendKernelRuntime::LoadData(mindspore::session::KernelGraph *graph, Debugger *debugger) {
  MS_EXCEPTION_IF_NULL(graph);
 #ifdef ENABLE_DEBUGGER
-  MS_LOG(INFO) << "start load step";
+  MS_LOG(INFO) << "Start load step";
  uint32_t cur_iter = 0;
-  MS_LOG(INFO) << "cur iter is " << cur_iter;
+  MS_LOG(INFO) << "Cur iter is " << cur_iter;
  // load output
  LoadOutput(graph, debugger);
  // load parameters
@ -421,7 +421,7 @@ bool AscendKernelRuntime::GenTask(const session::KernelGraph *graph) {
  }
  // Graph may have no compute node, such TensorAddGrad.
  if (task_info_list.empty()) {
-    MS_LOG(WARNING) << "graph " << graph->graph_id() << " have no compute node";
+    MS_LOG(WARNING) << "Graph " << graph->graph_id() << " have no compute node";
    return true;
  }
  AscendStreamAssign &assign_instance = AscendStreamAssign::GetInstance();
@ -432,7 +432,7 @@ bool AscendKernelRuntime::GenTask(const session::KernelGraph *graph) {
  assign_instance.GetWaitStreams(&wait_active_stream_list);
  std::vector<uint32_t> force_copy_stream_list;
  assign_instance.GetHcomStreams(&force_copy_stream_list);
-  MS_LOG(INFO) << "call DavinciModel total stream num:" << resource_manager.get_cur_stream_num()
+  MS_LOG(INFO) << "Call DavinciModel total stream num:" << resource_manager.get_cur_stream_num()
               << ", total event num:" << resource_manager.get_cur_event_num()
               << ", total label num:" << label_assign_instance.GetLabelNum(NOT_NULL(graph))
               << ", wait_active_stream_list size:" << wait_active_stream_list.size()
@ -524,7 +524,7 @@ bool AscendKernelRuntime::RunTask(const session::KernelGraph *graph) {

  bool status = ge::model_runner::ModelRunner::Instance().RunModel(graph->graph_id(), input_tensors, output_tensors);
  if (!status) {
-    MS_LOG(ERROR) << "run task failed";
+    MS_LOG(ERROR) << "Run task failed";
    DebugTaskIdName(graph->graph_id());
    return false;
  }
@ -543,18 +543,18 @@ bool AscendKernelRuntime::InitDevice() {
  int device_count = 0;
  auto ret = rtGetDeviceCount(&device_count);
  if (ret != RT_ERROR_NONE) {
-    MS_EXCEPTION(DeviceProcessError) << "rtGetDeviceCount, ret[" << static_cast<int>(ret) << "]";
+    MS_EXCEPTION(DeviceProcessError) << "Call rtGetDeviceCount, ret[" << static_cast<int>(ret) << "]";
  }

  ret = rtSetDevice(device_id_);
  if (ret != RT_ERROR_NONE) {
-    MS_EXCEPTION(DeviceProcessError) << "rtSetDevice, ret[" << static_cast<int>(ret) << "]";
+    MS_EXCEPTION(DeviceProcessError) << "Call rtSetDevice, ret[" << static_cast<int>(ret) << "]";
  }

  auto context_ptr = MsContext::GetInstance();
  MS_EXCEPTION_IF_NULL(context_ptr);
  if (context_ptr == nullptr) {
-    MS_LOG(ERROR) << "get MsContext instance failed";
+    MS_LOG(ERROR) << "Get MsContext instance failed";
    return false;
  }
  if (context_ptr->enable_hccl()) {
@ -566,17 +566,17 @@ bool AscendKernelRuntime::InitDevice() {

  ret = rtCtxCreate(&rt_context_, 0, device_id_);
  if (ret != RT_ERROR_NONE) {
-    MS_EXCEPTION(DeviceProcessError) << "rtCtxCreate, ret[" << static_cast<int>(ret) << "]";
+    MS_EXCEPTION(DeviceProcessError) << "Call rtCtxCreate, ret[" << static_cast<int>(ret) << "]";
  }

  ret = rtCtxSetCurrent(rt_context_);
  if (ret != RT_ERROR_NONE) {
-    MS_EXCEPTION(DeviceProcessError) << "rtCtxSetCurrent, ret[" << ret << "]";
+    MS_EXCEPTION(DeviceProcessError) << "Call rtCtxSetCurrent, ret[" << ret << "]";
  }

  ret = rtStreamCreate(&stream_, 0);
  if (ret != RT_ERROR_NONE) {
-    MS_LOG(EXCEPTION) << "rtStreamCreate, ret[" << ret << "]";
+    MS_LOG(EXCEPTION) << "Call rtStreamCreate, ret[" << ret << "]";
  }

  return true;
@ -585,14 +585,14 @@ bool AscendKernelRuntime::InitDevice() {
 bool AscendKernelRuntime::ResetDevice() {
  auto ret = rtCtxSetCurrent(rt_context_);
  if (ret != RT_ERROR_NONE) {
-    MS_LOG(ERROR) << "call rtCtxSetCurrent failed";
+    MS_LOG(ERROR) << "Call rtCtxSetCurrent failed";
    return false;
  }

  if (stream_ != nullptr) {
    ret = rtStreamDestroy(stream_);
    if (ret != RT_ERROR_NONE) {
-      MS_LOG(EXCEPTION) << "rtStreamDestroy, ret[" << ret << "]";
+      MS_LOG(EXCEPTION) << "Call rtStreamDestroy, ret[" << ret << "]";
    }
    stream_ = nullptr;
  }
@ -600,7 +600,7 @@ bool AscendKernelRuntime::ResetDevice() {
  if (rt_context_ != nullptr) {
    ret = rtCtxDestroy(rt_context_);
    if (ret != RT_ERROR_NONE) {
-      MS_EXCEPTION(DeviceProcessError) << "rtCtxDestroy, ret[" << ret << "]";
+      MS_EXCEPTION(DeviceProcessError) << "Call rtCtxDestroy, ret[" << ret << "]";
    }
    rt_context_ = nullptr;
  }
@ -613,30 +613,30 @@ bool AscendKernelRuntime::HcclInit() {
  if (!context_ptr->IsTsdOpened()) {
    MS_LOG(EXCEPTION) << "Hccl dependent tsd is not open";
  }
-  MS_LOG(INFO) << "do hcom init";
+  MS_LOG(INFO) << "Do hcom init";
  auto config_path_str = std::getenv("MINDSPORE_HCCL_CONFIG_PATH");
  if (config_path_str == nullptr) {
    config_path_str = std::getenv("RANK_TABLE_FILE");
    if (config_path_str == nullptr) {
-      MS_LOG(ERROR) << "get hccl json config failed, please set env MINDSPORE_HCCL_CONFIG_PATH or RANK_TABLE_FILE";
+      MS_LOG(ERROR) << "Get hccl json config failed, please set env MINDSPORE_HCCL_CONFIG_PATH or RANK_TABLE_FILE";
      return false;
    }
  }
  if (strlen(config_path_str) > PATH_MAX) {
-    MS_LOG(ERROR) << "file path oversize";
+    MS_LOG(ERROR) << "File path oversize";
    return false;
  }
  std::string rank_id_str = GetRankId();
  auto full_path = realpath(config_path_str, nullptr);
  if (full_path == nullptr) {
-    MS_LOG(ERROR) << "file path " << config_path_str << " does not exist";
+    MS_LOG(ERROR) << "File path " << config_path_str << " does not exist";
    return false;
  }
  MS_LOG(INFO) << "MINDSPORE_HCCL_CONFIG_PATH : " << full_path << ", RANK_ID: " << rank_id_str;
  hcclResult_t res = hcom_init(full_path, rank_id_str.c_str());
  free(full_path);
  if (res != HCCL_SUCCESS) {
-    MS_LOG(ERROR) << "hcom init failed, res is " << static_cast<int>(res);
+    MS_LOG(ERROR) << "Hcom init failed, res is " << static_cast<int>(res);
    return false;
  }
  return true;
@ -646,15 +646,15 @@ bool AscendKernelRuntime::DestroyHccl() {
  auto context_ptr = MsContext::GetInstance();
  MS_EXCEPTION_IF_NULL(context_ptr);
  if (!NeedDestroyHccl()) {
-    MS_LOG(INFO) << "hccl is not enable, no need to close.";
+    MS_LOG(INFO) << "Hccl is not enable, no need to close.";
    return true;
  }
  hcclResult_t res = hcom_destroy();
  if (res != HCCL_SUCCESS) {
-    MS_LOG(ERROR) << "hccl destroy failed";
+    MS_LOG(ERROR) << "Hccl destroy failed";
    return false;
  }
-  MS_LOG(INFO) << "hccl destroy successful, status = " << res << ".";
+  MS_LOG(INFO) << "Hccl destroy successful, status = " << res << ".";
  context_ptr->set_enable_hccl(false);
  return true;
 }
--- a/mindspore/ccsrc/device/ascend/ascend_stream_assign.cc
+++ b/mindspore/ccsrc/device/ascend/ascend_stream_assign.cc
--- a/mindspore/ccsrc/device/cpu/cpu_kernel_runtime.cc
+++ b/mindspore/ccsrc/device/cpu/cpu_kernel_runtime.cc
@ -142,6 +142,37 @@ DeviceAddressPtr CPUKernelRuntime::CreateDeviceAddress(void *device_ptr, size_t
  return std::make_shared<CPUDeviceAddress>(device_ptr, device_size, format, type_id);
 }

+tensor::TensorPtr CPUKernelRuntime::CreatTensorForOutput(const CNodePtr &node, size_t index,
+                                                         std::set<DeviceAddressPtr> *bound_addresses,
+                                                         std::vector<tensor::TensorPtr> *need_sync_outputs) {
+  MS_EXCEPTION_IF_NULL(node);
+  MS_EXCEPTION_IF_NULL(bound_addresses);
+  MS_EXCEPTION_IF_NULL(need_sync_outputs);
+  size_t output_size = AnfAlgo::GetOutputTensorNum(node);
+  if (index >= output_size) {
+    MS_LOG(EXCEPTION) << "Invalid input index " << index;
+  }
+  auto address = AnfAlgo::GetMutableOutputAddr(node, index);
+  MS_EXCEPTION_IF_NULL(address);
+  auto shape = AnfAlgo::GetOutputInferShape(node, index);
+  std::vector<int> temp_shape;
+  (void)temp_shape.insert(temp_shape.end(), shape.begin(), shape.end());
+  TypeId type_id = AnfAlgo::GetOutputInferDataType(node, index);
+  type_id = GetCPUSupportOutputTypeId(type_id);
+  tensor::TensorPtr tensor = std::make_shared<tensor::Tensor>(type_id, temp_shape);
+  MS_EXCEPTION_IF_NULL(tensor);
+  if (bound_addresses->find(address) != bound_addresses->end()) {
+    tensor->set_device_address(address);
+    need_sync_outputs->emplace_back(tensor);
+  } else {
+    address->ptr_ = tensor->data_c();
+    address->ref_count_ = INIT_NODE_REF;
+    (void)bound_addresses->insert(address);
+  }
+  tensor->set_dirty(false);
+  return tensor;
+}
+
 BaseRef CPUKernelRuntime::CreatTensorForOutput(const session::KernelWithIndex &kernel_with_index,
                                               const std::unordered_map<AnfNode *, tensor::TensorPtr> &input_map,
                                               std::set<DeviceAddressPtr> *bound_addresses,
@ -161,29 +192,7 @@ BaseRef CPUKernelRuntime::CreatTensorForOutput(const session::KernelWithIndex &k
      }
      return ret;
    }
-    size_t output_size = AnfAlgo::GetOutputTensorNum(node);
-    if (index >= output_size) {
-      MS_LOG(EXCEPTION) << "Invalid input index " << index;
-    }
-    auto address = AnfAlgo::GetMutableOutputAddr(node, index);
-    MS_EXCEPTION_IF_NULL(address);
-    auto shape = AnfAlgo::GetOutputInferShape(node, index);
-    std::vector<int> temp_shape;
-    (void)temp_shape.insert(temp_shape.end(), shape.begin(), shape.end());
-    TypeId type_id = AnfAlgo::GetOutputInferDataType(node, index);
-    type_id = GetCPUSupportOutputTypeId(type_id);
-    tensor::TensorPtr tensor = std::make_shared<tensor::Tensor>(type_id, temp_shape);
-    MS_EXCEPTION_IF_NULL(tensor);
-    if (bound_addresses->find(address) != bound_addresses->end()) {
-      tensor->set_device_address(address);
-      need_sync_outputs->emplace_back(tensor);
-    } else {
-      address->ptr_ = tensor->data_c();
-      address->ref_count_ = INIT_NODE_REF;
-      (void)bound_addresses->insert(address);
-    }
-    tensor->set_dirty(false);
-    return tensor;
+    return CreatTensorForOutput(node, index, bound_addresses, need_sync_outputs);
  } else if (input_node->isa<Parameter>() || input_node->isa<ValueNode>()) {
    auto iter = input_map.find(input_node.get());
    if (iter != input_map.end()) {
@ -247,6 +256,7 @@ void CPUKernelRuntime::BindInputOutput(const session::KernelGraph *kernel_graph,

 void CPUKernelRuntime::AddRuntimeAddress(DeviceAddress *address, std::vector<kernel::AddressPtr> *input_list) {
  MS_EXCEPTION_IF_NULL(address);
+  MS_EXCEPTION_IF_NULL(input_list);
  kernel::AddressPtr input = std::make_shared<kernel::Address>();
  MS_EXCEPTION_IF_NULL(input);
  if (address->ptr_ == nullptr) {
--- a/mindspore/ccsrc/device/cpu/cpu_kernel_runtime.h
+++ b/mindspore/ccsrc/device/cpu/cpu_kernel_runtime.h
@ -49,6 +49,10 @@ class CPUKernelRuntime : public KernelRuntime {
                                       TypeId type_id) override;

 private:
+  tensor::TensorPtr CreatTensorForOutput(const CNodePtr &node, size_t index,
+                                         std::set<DeviceAddressPtr> *bound_addresses,
+                                         std::vector<tensor::TensorPtr> *need_sync_outputs);
+
  BaseRef CreatTensorForOutput(const session::KernelWithIndex &kernel_with_index,
                               const std::unordered_map<AnfNode *, tensor::TensorPtr> &input_map,
                               std::set<DeviceAddressPtr> *bound_addresses,
--- a/mindspore/ccsrc/device/cpu/cpu_simple_mem_plan.cc
+++ b/mindspore/ccsrc/device/cpu/cpu_simple_mem_plan.cc
@ -56,7 +56,13 @@ void CPUSimpleMemPlan::MemPlan(const session::KernelGraph *graph) {
  graph_mem_size_[graph] = total_mem_size;
 }

-size_t CPUSimpleMemPlan::GetGraphMemSize(const session::KernelGraph *graph) { return graph_mem_size_[graph]; }
+size_t CPUSimpleMemPlan::GetGraphMemSize(const session::KernelGraph *graph) const {
+  auto iter = graph_mem_size_.find(graph);
+  if (iter != graph_mem_size_.end()) {
+    return iter->second;
+  }
+  return 0;
+}

 void CPUSimpleMemPlan::MemAssign(const session::KernelGraph *graph, uint8_t *base_ptr) {
  MS_EXCEPTION_IF_NULL(graph);
--- a/mindspore/ccsrc/device/cpu/cpu_simple_mem_plan.h
+++ b/mindspore/ccsrc/device/cpu/cpu_simple_mem_plan.h
@ -31,7 +31,7 @@ class CPUSimpleMemPlan {

  void MemPlan(const session::KernelGraph *graph);
  void MemAssign(const session::KernelGraph *graph, uint8_t *base_ptr);
-  size_t GetGraphMemSize(const session::KernelGraph *graph);
+  size_t GetGraphMemSize(const session::KernelGraph *graph) const;

 private:
  std::unordered_map<const session::KernelGraph *, size_t> graph_mem_size_;