From 33b2735560ca19fe629f3c84398801dbf003cdc6 Mon Sep 17 00:00:00 2001
From: zhaodezan
Date: Tue, 22 Sep 2020 09:35:31 -0400
Subject: [PATCH] pad int8 support mirror pad.

Add REFLECT/SYMMETRIC (mirror) padding support to the int8 Pad kernel.
Paddings for mirror mode come from the second input tensor; they are
validated against the input shape, extended to MAX_PAD_SIZE, and the
in/out strides are precomputed before the parallel mirror-pad launch.

Review fixes folded into this revision:
- check the return value of HandleMirrorPad() so that invalid paddings
  abort Run() instead of launching MirrorPadInt8 with bogus strides
- compare the task result in MirrorPadImplInt8 against RET_OK (the
  lite error-code domain RunMirrorPadImpl actually returns)
- add missing spaces in the CheckPaddings / CopyPaddingFromInput logs
---
 mindspore/lite/nnacl/int8/pad.c                    |  37 +++++
 mindspore/lite/nnacl/int8/pad.h                    |   2 +
 .../src/runtime/kernel/arm/int8/pad_int8.cc        | 152 +++++++++++++++++-
 .../src/runtime/kernel/arm/int8/pad_int8.h         |   7 +
 4 files changed, 193 insertions(+), 5 deletions(-)

diff --git a/mindspore/lite/nnacl/int8/pad.c b/mindspore/lite/nnacl/int8/pad.c
index 6353ebbb14..f1da8c1f83 100644
--- a/mindspore/lite/nnacl/int8/pad.c
+++ b/mindspore/lite/nnacl/int8/pad.c
@@ -32,3 +32,40 @@ int PadConstant4D(const int8_t *in_data, int8_t *out_data, const int32_t *in_dim
   }
   return NNACL_OK;
 }
+
+int TransOut2InputDimIndexInt8(int out_dim_index, int left_pad, int in_dim, int offset) {
+  if (out_dim_index < left_pad) {
+    // left pad
+    const int index_sum = left_pad + offset - 1;
+    return MSMAX(index_sum - out_dim_index, offset);
+  }
+  out_dim_index -= left_pad;
+  if (out_dim_index < in_dim) {
+    return out_dim_index;
+  }
+  // right pad
+  out_dim_index -= in_dim;
+  const int index_sum = in_dim - 1 - offset;
+  return MSMAX(index_sum - out_dim_index, 0);
+}
+
+int GetInputFlattenIndexInt8(int out_flatten_index, const int *input_shape, const PadParameter *pad_param) {
+  int in_flatten_index = 0;
+  int i;
+  for (i = 0; i < DEFAULT_PAD_NDIMS; ++i) {
+    int left_pad = pad_param->paddings_[i * 2];
+    int out_dim_index = out_flatten_index / pad_param->out_strides[i];
+    out_flatten_index %= pad_param->out_strides[i];
+    int in_dim_index = TransOut2InputDimIndexInt8(out_dim_index, left_pad, input_shape[i], pad_param->mirror_offset_);
+    in_flatten_index += in_dim_index * pad_param->in_strides[i];
+  }
+  return in_flatten_index;
+}
+
+void MirrorPadInt8(const int8_t *input_data, int8_t *output_data, const int *input_shape, const PadParameter *pad_param,
+                   int begin, int end) {
+  int i = 0;
+  for (i = begin; i < end; ++i) {
+    output_data[i] = input_data[GetInputFlattenIndexInt8(i, input_shape, pad_param)];
+  }
+}
diff --git a/mindspore/lite/nnacl/int8/pad.h b/mindspore/lite/nnacl/int8/pad.h
index 28d5c7fee1..41da165558 100644
--- a/mindspore/lite/nnacl/int8/pad.h
+++ b/mindspore/lite/nnacl/int8/pad.h
@@ -26,6 +26,8 @@ extern "C" {
 #endif
 int PadConstant4D(const int8_t *in_data, int8_t *out_data, const int32_t *in_dims, const int32_t *out_dims,
                   const int32_t *paddings, const int tid, const int thread_num);
+void MirrorPadInt8(const int8_t *input_data, int8_t *output_data, const int *input_shape, const PadParameter *pad_param,
+                   int begin, int end);
 #ifdef __cplusplus
 }
 #endif
diff --git a/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.cc b/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.cc
index 7405679cad..0ca7518696 100644
--- a/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.cc
+++ b/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.cc
@@ -15,12 +15,23 @@
  */
 
 #include "src/runtime/kernel/arm/int8/pad_int8.h"
+#include <string>
+#include "include/errorcode.h"
+#include "nnacl/errorcode.h"
+#include "nnacl/int8/pad.h"
+#include "src/runtime/runtime_api.h"
 
 using mindspore::lite::RET_ERROR;
 using mindspore::lite::RET_MEMORY_FAILED;
 using mindspore::lite::RET_OK;
+using mindspore::lite::RET_NULL_PTR;
 
 namespace mindspore::kernel {
+
+namespace {
+constexpr size_t kMirrorPadInputSize = 2;
+}
+
 void PadInt8CPUKernel::FreeQuantParam() {
   if (pad_param_->pad_quant_arg_.in_quant_args_ != nullptr) {
     free(pad_param_->pad_quant_arg_.in_quant_args_);
@@ -122,6 +133,123 @@ int PadInt8Impl(void *cdata, int task_id) {
   return RET_OK;
 }
 
+int PadInt8CPUKernel::HandleMirrorPad() {
+  auto ret = CopyPaddingFromInput();
+  if (ret != RET_OK) {
+    return ret;
+  }
+  ret = CheckPaddings(pad_param_->paddings_, DEFAULT_PAD_NDIMS, in_dims_, pad_param_->pad_mode_);
+  if (ret != RET_OK) {
+    return ret;
+  }
+  CalculateStrides();
+  pad_param_->mirror_offset_ = pad_param_->pad_mode_ == static_cast<int>(schema::PaddingMode_REFLECT) ? 1 : 0;
+  return RET_OK;
+}
+
+void PadInt8CPUKernel::CalculateStrides() {
+  pad_param_->in_strides[DEFAULT_PAD_NDIMS - 1] = 1;
+  for (auto i = DEFAULT_PAD_NDIMS - 2; i >= 0; --i) {
+    pad_param_->in_strides[i] = in_dims_[i + 1] * pad_param_->in_strides[i + 1];
+  }
+  for (auto i = 0; i < DEFAULT_PAD_NDIMS; ++i) {
+    out_dims_[i] = in_dims_[i] + pad_param_->paddings_[i * 2] + pad_param_->paddings_[i * 2 + 1];
+  }
+  pad_param_->out_strides[DEFAULT_PAD_NDIMS - 1] = 1;
+  for (auto i = DEFAULT_PAD_NDIMS - 2; i >= 0; --i) {
+    pad_param_->out_strides[i] = out_dims_[i + 1] * pad_param_->out_strides[i + 1];
+  }
+}
+
+int PadInt8CPUKernel::ExtendPaddings(int *paddings, int length, const int *ori_paddings, int ori_length) {
+  if (paddings == nullptr || ori_paddings == nullptr) {
+    return RET_NULL_PTR;
+  }
+  for (auto i = 0; i < length - ori_length; ++i) {
+    paddings[i] = 0;
+  }
+  for (auto i = length - ori_length; i < length; ++i) {
+    paddings[i] = ori_paddings[i - (length - ori_length)];
+  }
+  return RET_OK;
+}
+
+int PadInt8CPUKernel::RunMirrorPadImpl(int task_id) {
+  auto input = in_tensors_.at(0);
+  auto output = out_tensors_.at(0);
+  auto input_data = reinterpret_cast<int8_t *>(input->MutableData());
+  auto output_data = reinterpret_cast<int8_t *>(output->MutableData());
+
+  int unit = UP_DIV(output->ElementsNum(), context_->thread_num_);
+  int begin = unit * task_id;
+  int end = MSMIN(begin + unit, output->ElementsNum());
+  MirrorPadInt8(input_data, output_data, in_dims_, pad_param_, begin, end);
+  return RET_OK;
+}
+
+int MirrorPadImplInt8(void *cdata, int task_id) {
+  auto padKernel = reinterpret_cast<PadInt8CPUKernel *>(cdata);
+  int error_code = padKernel->RunMirrorPadImpl(task_id);
+  if (error_code != RET_OK) {
+    MS_LOG(ERROR) << "Pad Run error task_id[" << task_id << "] error_code[" << error_code << "]";
+    return RET_ERROR;
+  }
+  return RET_OK;
+}
+
+int PadInt8CPUKernel::CheckPaddings(int *paddings, int length, int *input_shape, int mode) {
+  if (paddings == nullptr || input_shape == nullptr) {
+    return RET_NULL_PTR;
+  }
+  std::string prefix;
+  int offset;
+  if (mode == static_cast<int>(schema::PaddingMode_SYMMETRIC)) {
+    prefix = "For Pad SYMMETRIC ";
+    offset = 0;
+  } else {
+    prefix = "For Pad REFLECT ";
+    offset = 1;
+  }
+  for (auto i = 0; i < length; ++i) {
+    int max_valid = input_shape[i] - offset;
+    if (paddings[i * 2] > max_valid) {
+      MS_LOG(ERROR) << prefix << "paddings " << paddings[i * 2] << " should be less than " << max_valid + 1;
+      return RET_ERROR;
+    }
+    if (paddings[i * 2 + 1] > max_valid) {
+      MS_LOG(ERROR) << prefix << "paddings " << paddings[i * 2 + 1] << " should be less than " << max_valid + 1;
+      return RET_ERROR;
+    }
+  }
+  return RET_OK;
+}
+
+int PadInt8CPUKernel::CopyPaddingFromInput() {
+  if (in_tensors_.size() != kMirrorPadInputSize) {
+    MS_LOG(ERROR) << "Pad Reflect or Symmetric mode need 2 inputs, got " << in_tensors_.size();
+    return RET_ERROR;
+  }
+  auto padding_tensor = in_tensors_.at(1);
+  auto paddings = reinterpret_cast<int *>(padding_tensor->MutableData());
+  if (paddings == nullptr) {
+    MS_LOG(ERROR) << "Pad second input data nullptr";
+    return RET_ERROR;
+  }
+  auto input_shape = in_tensors_.at(0)->shape();
+  int rank = static_cast<int>(input_shape.size());
+  if (padding_tensor->ElementsNum() != rank * 2) {
+    MS_LOG(ERROR) << "Pad second input elements num " << padding_tensor->ElementsNum() << ", should be " << rank * 2;
+    return RET_ERROR;
+  }
+
+  auto ret = ExtendPaddings(pad_param_->paddings_, MAX_PAD_SIZE, paddings, padding_tensor->ElementsNum());
+  if (ret != RET_OK) {
+    return ret;
+  }
+  pad_param_->padding_length = MAX_PAD_SIZE;
+  return RET_OK;
+}
+
 int PadInt8CPUKernel::Run() {
   auto ret = Prepare();
   if (ret != RET_OK) {
@@ -131,11 +259,25 @@ int PadInt8CPUKernel::Run() {
   in_data_ = reinterpret_cast<int8_t *>(in_tensors_[0]->MutableData());
   out_data_ = reinterpret_cast<int8_t *>(out_tensors_[0]->MutableData());
 
-  memset(out_data_, pad_param_->pad_quant_arg_.constant_value_[0], out_tensors_[0]->ElementsNum() * sizeof(int8_t));
-  int error_code = ParallelLaunch(this->context_->thread_pool_, PadInt8Impl, this, context_->thread_num_);
-  if (error_code != RET_OK) {
-    MS_LOG(ERROR) << "Resize run error, error_code[" << error_code << "]";
-    return RET_ERROR;
+  int error_code;
+  if (pad_param_->pad_mode_ == static_cast<int>(schema::PaddingMode_CONSTANT)) {
+    memset(out_data_, pad_param_->pad_quant_arg_.constant_value_[0], out_tensors_[0]->ElementsNum() * sizeof(int8_t));
+    error_code = ParallelLaunch(this->context_->thread_pool_, PadInt8Impl, this, context_->thread_num_);
+    if (error_code != RET_OK) {
+      MS_LOG(ERROR) << "Resize run error, error_code[" << error_code << "]";
+      return RET_ERROR;
+    }
+  } else {
+    // mirror pad case: paddings come from the second input tensor
+    error_code = HandleMirrorPad();
+    if (error_code != RET_OK) { return error_code; }
+
+    error_code = ParallelLaunch(this->context_->thread_pool_, MirrorPadImplInt8, this, context_->thread_num_);
+    if (error_code != RET_OK) {
+      MS_LOG(ERROR) << "Pad Reflect or Symmetric mode run error, error_code[" << error_code << "]";
+      return RET_ERROR;
+    }
   }
+
+  return RET_OK;
 }
 }  // namespace mindspore::kernel
diff --git a/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.h b/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.h
index b8b9ba294b..24c417e86d 100644
--- a/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.h
+++ b/mindspore/lite/src/runtime/kernel/arm/int8/pad_int8.h
@@ -39,6 +39,7 @@ class PadInt8CPUKernel : public LiteKernel {
   int ReSize() override;
   int Run() override;
   int RunImpl(int task_id);
+  int RunMirrorPadImpl(int task_id);
 
  private:
   int SetQuantParam();
@@ -45,7 +46,13 @@ class PadInt8CPUKernel : public LiteKernel {
   int InitPadParam();
   void FreeQuantParam();
 
  private:
+  int HandleMirrorPad();
+  int CheckPaddings(int *paddings, int length, int *input_shape, int mode);
+  int CopyPaddingFromInput();
+  void CalculateStrides();
+  int ExtendPaddings(int *paddings, int length, const int *ori_paddings, int ori_length);
+
   PadParameter *pad_param_ = nullptr;
   int8_t *in_data_ = nullptr;
   int8_t *out_data_ = nullptr;