Paddle/paddle/fluid/operators/prior_box_op.h

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include <algorithm>
#include <vector>
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/operators/math/math_function.h"
#include "paddle/fluid/platform/transform.h"

namespace paddle {
namespace operators {

// Expands the user-supplied aspect ratios into the list used to generate
// priors.
//
// The output vector is cleared and always starts with 1.0. Every input ratio
// is then appended, in input order, unless it is within 1e-6 of a value that
// is already in the output. When `flip` is true, the reciprocal of each
// appended ratio is appended immediately after it; the reciprocal itself is
// not checked for duplicates at the moment it is inserted.
//
//   input_aspect_ratior   ratios to expand.
//   flip                  also emit 1 / ratio for every ratio that is kept.
//   output_aspect_ratior  receives the result; it is dereferenced
//                         unconditionally, so it must not be null.
inline void ExpandAspectRatios(const std::vector<float>& input_aspect_ratior,
                               bool flip,
                               std::vector<float>* output_aspect_ratior) {
  constexpr float epsilon = 1e-6;
  std::vector<float>& expanded = *output_aspect_ratior;
  expanded.clear();
  expanded.push_back(1.0f);

  for (const float candidate : input_aspect_ratior) {
    // A ratio counts as a duplicate when it is within epsilon of any value
    // collected so far (including the leading 1.0 and earlier reciprocals).
    const bool duplicate = std::any_of(
        expanded.begin(), expanded.end(),
        [&](float kept) { return fabs(candidate - kept) < epsilon; });
    if (duplicate) {
      continue;
    }

    expanded.push_back(candidate);
    if (flip) {
      expanded.push_back(1.0f / candidate);
    }
  }
}

// Unary functor that clamps its argument to the closed interval [0, 1].
// Values below 0 become 0, values above 1 become 1, everything else is
// returned unchanged.
template <typename T>
struct ClipFunctor {
  HOSTDEVICE inline T operator()(T in) const {
    const T lower_bound = static_cast<T>(0.);
    const T upper_bound = static_cast<T>(1.);
    // Raise to the lower bound first, then cap at the upper bound.
    const T raised = std::max<T>(in, lower_bound);
    return std::min<T>(raised, upper_bound);
  }
};

// Kernel that fills the "Boxes" and "Variances" outputs of the prior box
// operator.
//
// For every (h, w) cell of the "Input" feature map it writes a set of boxes
// centred on that cell, expressed as (xmin, ymin, xmax, ymax) divided by the
// width/height read from "Image". "Variances" is filled by repeating the
// `variances` attribute once per generated box.
//
// Attributes read: min_sizes, max_sizes, aspect_ratios, variances, flip,
// clip, step_w, step_h, offset.
//
// NOTE(review): neither output is resized to its final shape here; "Boxes" is
// viewed as a rank-4 tensor indexed (h, w, prior, coord), so its dims are
// presumably set by the operator's shape inference before Compute runs --
// confirm against the op definition.
template <typename T>
class PriorBoxOpKernel : public framework::OpKernel<T> {
 public:
  // Computes all prior boxes and their variances for one invocation.
  //   ctx  execution context supplying the tensors and attributes above.
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* input = ctx.Input<paddle::framework::Tensor>("Input");
    auto* image = ctx.Input<paddle::framework::Tensor>("Image");
    auto* boxes = ctx.Output<paddle::framework::Tensor>("Boxes");
    auto* vars = ctx.Output<paddle::framework::Tensor>("Variances");

    auto min_sizes = ctx.Attr<std::vector<float>>("min_sizes");
    auto max_sizes = ctx.Attr<std::vector<float>>("max_sizes");
    auto input_aspect_ratio = ctx.Attr<std::vector<float>>("aspect_ratios");
    auto variances = ctx.Attr<std::vector<float>>("variances");
    auto flip = ctx.Attr<bool>("flip");
    auto clip = ctx.Attr<bool>("clip");

    // Working ratio list: always starts with 1.0, de-duplicated, optionally
    // extended with reciprocals (see ExpandAspectRatios).
    std::vector<float> aspect_ratios;
    ExpandAspectRatios(input_aspect_ratio, flip, &aspect_ratios);

    T step_w = static_cast<T>(ctx.Attr<float>("step_w"));
    T step_h = static_cast<T>(ctx.Attr<float>("step_h"));
    T offset = static_cast<T>(ctx.Attr<float>("offset"));

    // Dimension 3 is read as width and dimension 2 as height for both
    // tensors (presumably NCHW layout -- confirm).
    auto img_width = image->dims()[3];
    auto img_height = image->dims()[2];

    auto feature_width = input->dims()[3];
    auto feature_height = input->dims()[2];

    // If either step attribute is zero, BOTH steps are derived from the
    // image-to-feature-map size ratio; otherwise the attributes are used.
    T step_width, step_height;
    if (step_w == 0 || step_h == 0) {
      step_width = static_cast<T>(img_width) / feature_width;
      step_height = static_cast<T>(img_height) / feature_height;
    } else {
      step_width = step_w;
      step_height = step_h;
    }

    // Boxes per cell: one per (min_size, aspect_ratio) pair, plus
    // max_sizes.size() extra square boxes when max_sizes is given.
    // NOTE(review): the loop below emits one extra box per min_size (not per
    // max_size) and indexes max_sizes[s], so this count matches the loop only
    // when max_sizes is empty or has the same length as min_sizes. That
    // equality is not checked in this function.
    int num_priors = aspect_ratios.size() * min_sizes.size();
    if (max_sizes.size() > 0) {
      num_priors += max_sizes.size();
    }

    boxes->mutable_data<T>(ctx.GetPlace());
    vars->mutable_data<T>(ctx.GetPlace());

    // Rank-4 view of the output, indexed as (h, w, prior index, coordinate).
    auto e_boxes = framework::EigenTensor<T, 4>::From(*boxes);
    for (int h = 0; h < feature_height; ++h) {
      for (int w = 0; w < feature_width; ++w) {
        // Box centre for this cell, in the same units as the step values.
        T center_x = (w + offset) * step_width;
        T center_y = (h + offset) * step_height;
        // Despite the names, these hold HALF the box width/height.
        T box_width, box_height;
        // Running prior index within the current cell.
        int idx = 0;
        for (size_t s = 0; s < min_sizes.size(); ++s) {
          auto min_size = min_sizes[s];
          // One prior per aspect ratio: width scales with sqrt(ar) and height
          // with 1 / sqrt(ar).
          for (size_t r = 0; r < aspect_ratios.size(); ++r) {
            float ar = aspect_ratios[r];
            box_width = min_size * sqrt(ar) / 2.;
            box_height = min_size / sqrt(ar) / 2.;
            // Corners are divided by the image size: xmin, ymin, xmax, ymax.
            e_boxes(h, w, idx, 0) = (center_x - box_width) / img_width;
            e_boxes(h, w, idx, 1) = (center_y - box_height) / img_height;
            e_boxes(h, w, idx, 2) = (center_x + box_width) / img_width;
            e_boxes(h, w, idx, 3) = (center_y + box_height) / img_height;
            idx++;
          }
          if (max_sizes.size() > 0) {
            auto max_size = max_sizes[s];
            // Additional square prior with side sqrt(min_size * max_size).
            box_width = box_height = sqrt(min_size * max_size) / 2.;
            e_boxes(h, w, idx, 0) = (center_x - box_width) / img_width;
            e_boxes(h, w, idx, 1) = (center_y - box_height) / img_height;
            e_boxes(h, w, idx, 2) = (center_x + box_width) / img_width;
            e_boxes(h, w, idx, 3) = (center_y + box_height) / img_height;
            idx++;
          }
        }
      }
    }

    // Optionally clamp every box coordinate to [0, 1], in place.
    if (clip) {
      platform::Transform<platform::CPUDeviceContext> trans;
      ClipFunctor<T> clip_func;
      trans(ctx.template device_context<platform::CPUDeviceContext>(),
            boxes->data<T>(), boxes->data<T>() + boxes->numel(),
            boxes->data<T>(), clip_func);
    }

    // Stage the variance attribute in a temporary 1 x variances.size()
    // tensor so it can be broadcast below.
    framework::Tensor var_t;
    var_t.mutable_data<T>(
        framework::make_ddim({1, static_cast<int>(variances.size())}),
        ctx.GetPlace());
    auto var_et = framework::EigenTensor<T, 2>::From(var_t);
    for (size_t i = 0; i < variances.size(); ++i) {
      var_et(0, i) = variances[i];
    }

    // Temporarily view the output as a 2-D [box_num, variances.size()]
    // matrix, fill it by repeating the staged row box_num times, then restore
    // the original dims. The Resize calls must stay around the Eigen view.
    int box_num = feature_height * feature_width * num_priors;
    auto var_dim = vars->dims();
    vars->Resize({box_num, static_cast<int>(variances.size())});

    auto e_vars = framework::EigenMatrix<T, Eigen::RowMajor>::From(*vars);
    e_vars = var_et.broadcast(Eigen::DSizes<int, 2>(box_num, 1));

    vars->Resize(var_dim);
  }
};  // class PriorBoxOpKernel

}  // namespace operators
}  // namespace paddle
Fix the grammar in copyright. (#8403) 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.`
implement of prior box operator for ssd 7 years ago
			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#pragma once`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`#include <algorithm>`
			`#include <vector>`
Correct #include path 7 years ago			`#include "paddle/fluid/framework/op_registry.h"`
			`#include "paddle/fluid/operators/math/math_function.h"`
			`#include "paddle/fluid/platform/transform.h"`
implement of prior box operator for ssd 7 years ago
			`namespace paddle {`
			`namespace operators {`

update code 7 years ago			`inline void ExpandAspectRatios(const std::vector<float>& input_aspect_ratior,`
			`bool flip,`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`std::vector<float>* output_aspect_ratior) {`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into prior_box 7 years ago			`constexpr float epsilon = 1e-6;`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`output_aspect_ratior->clear();`
			`output_aspect_ratior->push_back(1.0f);`
implement of prior box operator for ssd 7 years ago			`for (size_t i = 0; i < input_aspect_ratior.size(); ++i) {`
			`float ar = input_aspect_ratior[i];`
			`bool already_exist = false;`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`for (size_t j = 0; j < output_aspect_ratior->size(); ++j) {`
			`if (fabs(ar - output_aspect_ratior->at(j)) < epsilon) {`
implement of prior box operator for ssd 7 years ago			`already_exist = true;`
			`break;`
			`}`
			`}`
			`if (!already_exist) {`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`output_aspect_ratior->push_back(ar);`
implement of prior box operator for ssd 7 years ago			`if (flip) {`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`output_aspect_ratior->push_back(1.0f / ar);`
implement of prior box operator for ssd 7 years ago			`}`
			`}`
			`}`
			`}`

update code 7 years ago			`template <typename T>`
			`struct ClipFunctor {`
add "inline" for ClipFunctor and refine code 7 years ago			`HOSTDEVICE inline T operator()(T in) const {`
update code 7 years ago			`return std::min<T>(std::max<T>(in, 0.), 1.);`
			`}`
			`};`

Add CUDA kernel for prior_box_op. (#9553) 7 years ago			`template <typename T>`
implement of prior box operator for ssd 7 years ago			`class PriorBoxOpKernel : public framework::OpKernel<T> {`
			`public:`
			`void Compute(const framework::ExecutionContext& ctx) const override {`
			`auto* input = ctx.Input<paddle::framework::Tensor>("Input");`
			`auto* image = ctx.Input<paddle::framework::Tensor>("Image");`
update code 7 years ago			`auto* boxes = ctx.Output<paddle::framework::Tensor>("Boxes");`
			`auto* vars = ctx.Output<paddle::framework::Tensor>("Variances");`
implement of prior box operator for ssd 7 years ago
refine prior_box 7 years ago			`auto min_sizes = ctx.Attr<std::vector<float>>("min_sizes");`
			`auto max_sizes = ctx.Attr<std::vector<float>>("max_sizes");`
implement of prior box operator for ssd 7 years ago			`auto input_aspect_ratio = ctx.Attr<std::vector<float>>("aspect_ratios");`
			`auto variances = ctx.Attr<std::vector<float>>("variances");`
			`auto flip = ctx.Attr<bool>("flip");`
			`auto clip = ctx.Attr<bool>("clip");`

			`std::vector<float> aspect_ratios;`
Fix CPPLint errors in operators (#9828) * Fix CPPLint errors in operators * Fix prior box op * Fix Prior Box op * Fix top_k_op.cu * Fix pool mkmldnn * Fix pool mkmldnn 7 years ago			`ExpandAspectRatios(input_aspect_ratio, flip, &aspect_ratios);`
implement of prior box operator for ssd 7 years ago
update code 7 years ago			`T step_w = static_cast<T>(ctx.Attr<float>("step_w"));`
			`T step_h = static_cast<T>(ctx.Attr<float>("step_h"));`
			`T offset = static_cast<T>(ctx.Attr<float>("offset"));`
implement of prior box operator for ssd 7 years ago
update code 7 years ago			`auto img_width = image->dims()[3];`
			`auto img_height = image->dims()[2];`
implement of prior box operator for ssd 7 years ago
update code 7 years ago			`auto feature_width = input->dims()[3];`
			`auto feature_height = input->dims()[2];`
implement of prior box operator for ssd 7 years ago
update code 7 years ago			`T step_width, step_height;`
implement of prior box operator for ssd 7 years ago			`if (step_w == 0 \|\| step_h == 0) {`
update code 7 years ago			`step_width = static_cast<T>(img_width) / feature_width;`
			`step_height = static_cast<T>(img_height) / feature_height;`
implement of prior box operator for ssd 7 years ago			`} else {`
			`step_width = step_w;`
			`step_height = step_h;`
			`}`

			`int num_priors = aspect_ratios.size() * min_sizes.size();`
			`if (max_sizes.size() > 0) {`
			`num_priors += max_sizes.size();`
			`}`

update code 7 years ago			`boxes->mutable_data<T>(ctx.GetPlace());`
			`vars->mutable_data<T>(ctx.GetPlace());`
implement of prior box operator for ssd 7 years ago
update code 7 years ago			`auto e_boxes = framework::EigenTensor<T, 4>::From(*boxes);`
update code 7 years ago			`for (int h = 0; h < feature_height; ++h) {`
			`for (int w = 0; w < feature_width; ++w) {`
update code 7 years ago			`T center_x = (w + offset) * step_width;`
			`T center_y = (h + offset) * step_height;`
			`T box_width, box_height;`
change output shape to [2, layer_height, layer_width, num_priors, 4] 7 years ago			`int idx = 0;`
implement of prior box operator for ssd 7 years ago			`for (size_t s = 0; s < min_sizes.size(); ++s) {`
refine prior_box 7 years ago			`auto min_size = min_sizes[s];`
Add CUDA kernel for prior_box_op. (#9553) 7 years ago			`// priors with different aspect ratios`
			`for (size_t r = 0; r < aspect_ratios.size(); ++r) {`
			`float ar = aspect_ratios[r];`
			`box_width = min_size * sqrt(ar) / 2.;`
			`box_height = min_size / sqrt(ar) / 2.;`
Fix bug in detection_output and mAP calculation in SSD. (#8985) * Clipping bbox in the mAP evaluator calculation. * Fix bug in detection_output and mAP calculation in SSD. * Fix bug in detection.py. * Fix bug in test_detection_map_op.py. 7 years ago			`e_boxes(h, w, idx, 0) = (center_x - box_width) / img_width;`
			`e_boxes(h, w, idx, 1) = (center_y - box_height) / img_height;`
			`e_boxes(h, w, idx, 2) = (center_x + box_width) / img_width;`
			`e_boxes(h, w, idx, 3) = (center_y + box_height) / img_height;`
change output shape to [2, layer_height, layer_width, num_priors, 4] 7 years ago			`idx++;`
implement of prior box operator for ssd 7 years ago			`}`
Add CUDA kernel for prior_box_op. (#9553) 7 years ago			`if (max_sizes.size() > 0) {`
			`auto max_size = max_sizes[s];`
			`// square prior with size sqrt(minSize * maxSize)`
			`box_width = box_height = sqrt(min_size * max_size) / 2.;`
Fix bug in detection_output and mAP calculation in SSD. (#8985) * Clipping bbox in the mAP evaluator calculation. * Fix bug in detection_output and mAP calculation in SSD. * Fix bug in detection.py. * Fix bug in test_detection_map_op.py. 7 years ago			`e_boxes(h, w, idx, 0) = (center_x - box_width) / img_width;`
			`e_boxes(h, w, idx, 1) = (center_y - box_height) / img_height;`
			`e_boxes(h, w, idx, 2) = (center_x + box_width) / img_width;`
			`e_boxes(h, w, idx, 3) = (center_y + box_height) / img_height;`
change output shape to [2, layer_height, layer_width, num_priors, 4] 7 years ago			`idx++;`
implement of prior box operator for ssd 7 years ago			`}`
			`}`
			`}`
			`}`

			`if (clip) {`
update code 7 years ago			`platform::Transform<platform::CPUDeviceContext> trans;`
			`ClipFunctor<T> clip_func;`
			`trans(ctx.template device_context<platform::CPUDeviceContext>(),`
			`boxes->data<T>(), boxes->data<T>() + boxes->numel(),`
			`boxes->data<T>(), clip_func);`
implement of prior box operator for ssd 7 years ago			`}`
update code 7 years ago
update code 7 years ago			`framework::Tensor var_t;`
			`var_t.mutable_data<T>(`
			`framework::make_ddim({1, static_cast<int>(variances.size())}),`
			`ctx.GetPlace());`
			`auto var_et = framework::EigenTensor<T, 2>::From(var_t);`
update code 7 years ago			`for (size_t i = 0; i < variances.size(); ++i) {`
update code 7 years ago			`var_et(0, i) = variances[i];`
implement of prior box operator for ssd 7 years ago			`}`
update code 7 years ago
update code 7 years ago			`int box_num = feature_height * feature_width * num_priors;`
update code 7 years ago			`auto var_dim = vars->dims();`
			`vars->Resize({box_num, static_cast<int>(variances.size())});`

			`auto e_vars = framework::EigenMatrix<T, Eigen::RowMajor>::From(*vars);`
			`e_vars = var_et.broadcast(Eigen::DSizes<int, 2>(box_num, 1));`

			`vars->Resize(var_dim);`
implement of prior box operator for ssd 7 years ago			`}`
update code 7 years ago			`}; // namespace operators`
implement of prior box operator for ssd 7 years ago
			`} // namespace operators`
			`} // namespace paddle`