refine code and fix

7 years ago · e6d8aca3bf
parent ea7dc9cbf6
commit e6d8aca3bf
5 changed files with 214 additions and 213 deletions
--- a/paddle/fluid/operators/math/jit_kernel.h
+++ b/paddle/fluid/operators/math/jit_kernel.h
@ -64,32 +64,32 @@ class KernelPool {
 template <typename T>
 class VMulKernel : public Kernel {
 public:
-  virtual void Compute(const int n, const T *x, const T *y, T *z) const = 0;
+  virtual void Compute(const T *x, const T *y, T *z) const = 0;
 };

 template <typename T>
 class VAddKernel : public Kernel {
 public:
-  virtual void Compute(const int n, const T *x, const T *y, T *z) const = 0;
+  virtual void Compute(const T *x, const T *y, T *z) const = 0;
 };

 template <typename T>
 class VScalKernel : public Kernel {
 public:
-  virtual void Compute(const int n, const T a, const T *x, T *y) const = 0;
-  virtual void Compute(const int n, const T a, T *x) const = 0;
+  virtual void Compute(const T a, const T *x, T *y) const = 0;
+  virtual void Compute(const T a, T *x) const = 0;
 };

 template <typename T>
 class VAddBiasKernel : public Kernel {
 public:
-  virtual void Compute(const int n, const T a, const T *x, T *y) const = 0;
+  virtual void Compute(const T a, const T *x, T *y) const = 0;
 };

 template <typename T>
 class VExpKernel : public Kernel {
 public:
-  virtual void Compute(const int n, const T *x, T *y) const = 0;
+  virtual void Compute(const T *x, T *y) const = 0;
 };

 template <typename T>
--- a/paddle/fluid/operators/math/jit_kernel_blas.cc
+++ b/paddle/fluid/operators/math/jit_kernel_blas.cc
--- a/paddle/fluid/operators/math/jit_kernel_exp.cc
+++ b/paddle/fluid/operators/math/jit_kernel_exp.cc
--- a/paddle/fluid/operators/math/jit_kernel_macro.h
+++ b/paddle/fluid/operators/math/jit_kernel_macro.h
@ -57,7 +57,7 @@ namespace jit = platform::jit;

 #define JITKERNEL_NEW_IMPL(ker, dtype, isa, k) \
  p = std::dynamic_pointer_cast<ker<dtype>>(   \
-      std::make_shared<ker##Impl<dtype, isa, k>>())
+      std::make_shared<ker##Impl<dtype, isa, k>>(d))

 #define JITKERNEL_WITH_DTYPE(ker_key, ker_class, ker_dtype, dtype_key, \
                             marco_declare, macro_key, macro_impl)     \
--- a/paddle/fluid/operators/math/jit_kernel_test.cc
+++ b/paddle/fluid/operators/math/jit_kernel_test.cc
@ -73,7 +73,7 @@ TEST(JitKernel, vaddbias) {
    auto trefe = GetCurrentUS();
    auto ttgts = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, a, x_data, ztgt_data);
+      ker->Compute(a, x_data, ztgt_data);
    }
    auto ttgte = GetCurrentUS();

@ -99,7 +99,7 @@ void vexp_mkl(const int n, const float* x, float* y) {

 TEST(JitKernel, vexp) {
  namespace jit = paddle::operators::math::jitkernel;
-  for (int d : {7, 8, 15, 16, 30, 128}) {
+  for (int d : {7, 8, 15, 16, 30, 128, 256}) {
    std::vector<float> x(d);
    std::vector<float> zref(d), ztgt(d);
    RandomVec<float>(d, x.data(), -2.f, 2.f);
@ -124,7 +124,7 @@ TEST(JitKernel, vexp) {

    auto ttgts = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, x_data, ztgt_data);
+      ker->Compute(x_data, ztgt_data);
    }
    auto ttgte = GetCurrentUS();

@ -164,7 +164,7 @@ void vsigmoid_better(
    y[i] = (x[i] < min) ? min : ((x[i] > max) ? max : x[i]);
    y[i] = 0.f - y[i];
  }
-  vexp->Compute(n, y, y);
+  vexp->Compute(y, y);
  for (int i = 0; i < n; ++i) {
    y[i] = 1.f / (1.f + y[i]);
  }
@ -226,10 +226,10 @@ void vtanh_better(
        const paddle::operators::math::jitkernel::VAddBiasKernel<float>>&
        vaddbias,
    const int n, const float* x, float* y) {
-  vscal->Compute(n, 2.f, x, y);
+  vscal->Compute(2.f, x, y);
  vsigmoid->Compute(y, y);
-  vscal->Compute(n, 2.f, y);
-  vaddbias->Compute(n, -1.f, y, y);
+  vscal->Compute(2.f, y);
+  vaddbias->Compute(-1.f, y, y);
 }

 TEST(JitKernel, vtanh) {
@ -359,12 +359,12 @@ TEST(JitKernel, vscal) {

    auto ttgts = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, a, x_data, ztgt_data);
+      ker->Compute(a, x_data, ztgt_data);
    }
    auto ttgte = GetCurrentUS();
    auto ttgts1 = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, a, y_data);
+      ker->Compute(a, y_data);
    }
    auto ttgte1 = GetCurrentUS();
    VLOG(3) << "Vec size " << d << ": refer takes: " << (trefe - trefs) / repeat
@ -444,7 +444,7 @@ TEST(JitKernel, vmul) {

    auto ttgts = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, x_data, y_data, ztgt_data);
+      ker->Compute(x_data, y_data, ztgt_data);
    }
    auto ttgte = GetCurrentUS();

@ -523,7 +523,7 @@ TEST(JitKernel, vadd) {

    auto ttgts = GetCurrentUS();
    for (int i = 0; i < repeat; ++i) {
-      ker->Compute(d, x_data, y_data, ztgt_data);
+      ker->Compute(x_data, y_data, ztgt_data);
    }
    auto ttgte = GetCurrentUS();