You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
769 lines
26 KiB
769 lines
26 KiB
/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License. */
|
|
|
|
#include <random>
|
|
#include <string>
|
|
#include <vector>
|
|
#include "gflags/gflags.h"
|
|
#include "glog/logging.h"
|
|
#include "gtest/gtest.h"
|
|
#include "paddle/fluid/operators/jit/kernels.h"
|
|
#include "paddle/fluid/platform/cpu_info.h"
|
|
#include "paddle/fluid/platform/place.h"
|
|
|
|
DEFINE_double(acc, 1e-5, "Test accuracy threshold.");
|
|
|
|
template <typename T>
|
|
void RandomVec(const int n, T* a, const T lower = static_cast<T>(-20.f),
|
|
const T upper = static_cast<T>(20.f)) {
|
|
static unsigned int seed = 100;
|
|
std::mt19937 rng(seed++);
|
|
std::uniform_real_distribution<double> uniform_dist(0, 1);
|
|
for (int i = 0; i < n; ++i) {
|
|
a[i] = static_cast<T>(uniform_dist(rng) * (upper - lower) + lower);
|
|
}
|
|
}
|
|
|
|
template <typename T>
|
|
void ExpectEQ(const T* target, const T* refer, int n) {
|
|
if (std::is_floating_point<T>::value) {
|
|
for (int i = 0; i < n; ++i) {
|
|
EXPECT_NEAR(target[i], refer[i], FLAGS_acc);
|
|
}
|
|
} else {
|
|
for (int i = 0; i < n; ++i) {
|
|
EXPECT_EQ(target[i], refer[i]);
|
|
}
|
|
}
|
|
}
|
|
|
|
std::vector<int> TestSizes() {
|
|
std::vector<int> s;
|
|
for (int i = 1; i < 32; ++i) {
|
|
s.push_back(i);
|
|
}
|
|
// test some large size
|
|
s.push_back(100);
|
|
s.push_back(1000);
|
|
s.push_back(2000);
|
|
return s;
|
|
}
|
|
|
|
namespace jit = paddle::operators::jit;
|
|
using CPUPlace = paddle::platform::CPUPlace;
|
|
|
|
template <typename KernelTuples, typename... Args>
|
|
struct TestFuncWithRefer {
|
|
void operator()(const typename KernelTuples::func_type tgt, Args... args) {
|
|
LOG(FATAL) << "Should specify this function.";
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::XYZNTuples<T>, std::vector<T>, std::vector<T>,
|
|
std::vector<T>> {
|
|
void operator()(const typename jit::XYZNTuples<T>::func_type tgt,
|
|
const std::vector<T>& x, const std::vector<T>& y,
|
|
const std::vector<T>& zref) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(zref.size(), x.size());
|
|
EXPECT_EQ(zref.size(), y.size());
|
|
const T* x_data = x.data();
|
|
const T* y_data = y.data();
|
|
const T* zref_data = zref.data();
|
|
const int d = zref.size();
|
|
|
|
std::vector<T> ztgt(d);
|
|
T* ztgt_data = ztgt.data();
|
|
// test normal
|
|
tgt(x_data, y_data, ztgt_data, d);
|
|
ExpectEQ<T>(ztgt_data, zref_data, d);
|
|
// test inplace x
|
|
std::copy(x.begin(), x.end(), ztgt.begin());
|
|
tgt(ztgt_data, y_data, ztgt_data, d);
|
|
ExpectEQ<T>(ztgt_data, zref_data, d);
|
|
// test inplace y
|
|
std::copy(y.begin(), y.end(), ztgt.begin());
|
|
tgt(x_data, ztgt_data, ztgt_data, d);
|
|
ExpectEQ<T>(ztgt_data, zref_data, d);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::AXYNTuples<T>, T, std::vector<T>,
|
|
std::vector<T>> {
|
|
void operator()(const typename jit::AXYNTuples<T>::func_type tgt, const T a,
|
|
const std::vector<T>& x, const std::vector<T>& yref) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(yref.size(), x.size());
|
|
const T* x_data = x.data();
|
|
const T* yref_data = yref.data();
|
|
const int d = yref.size();
|
|
std::vector<T> ytgt(d);
|
|
T* ytgt_data = ytgt.data();
|
|
// test normal
|
|
tgt(&a, x_data, ytgt_data, d);
|
|
ExpectEQ<T>(ytgt_data, yref_data, d);
|
|
// test inplace x
|
|
std::copy(x.begin(), x.end(), ytgt.begin());
|
|
tgt(&a, ytgt_data, ytgt_data, d);
|
|
ExpectEQ<T>(ytgt_data, yref_data, d);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::SoftmaxTuples<T>, std::vector<T>, std::vector<T>,
|
|
int, int> {
|
|
void operator()(const typename jit::SoftmaxTuples<T>::func_type tgt,
|
|
const std::vector<T>& x, const std::vector<T>& yref, int n,
|
|
int bs) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(yref.size(), x.size());
|
|
EXPECT_EQ(x.size(), static_cast<size_t>(n * bs));
|
|
const T* x_data = x.data();
|
|
const T* yref_data = yref.data();
|
|
std::vector<T> ytgt(n * bs);
|
|
T* ytgt_data = ytgt.data();
|
|
// test normal
|
|
tgt(x_data, ytgt_data, n, bs);
|
|
ExpectEQ<T>(ytgt_data, yref_data, n * bs);
|
|
// test inplace x
|
|
std::copy(x.begin(), x.end(), ytgt.begin());
|
|
tgt(ytgt_data, ytgt_data, n, bs);
|
|
ExpectEQ<T>(ytgt_data, yref_data, n * bs);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::XRNTuples<T>, std::vector<T>, T> {
|
|
void operator()(const typename jit::XRNTuples<T>::func_type tgt,
|
|
const std::vector<T>& x, const T ref_res) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
T tgt_res;
|
|
tgt(x.data(), &tgt_res, x.size());
|
|
ExpectEQ<T>(&tgt_res, &ref_res, 1);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::XYNTuples<T>, std::vector<T>, std::vector<T>> {
|
|
void operator()(const typename jit::XYNTuples<T>::func_type tgt,
|
|
const std::vector<T>& x, const std::vector<T>& yref) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(yref.size(), x.size());
|
|
const T* x_data = x.data();
|
|
const T* yref_data = yref.data();
|
|
const int d = yref.size();
|
|
std::vector<T> ytgt(d);
|
|
T* ytgt_data = ytgt.data();
|
|
// test normal
|
|
tgt(x_data, ytgt_data, d);
|
|
ExpectEQ<T>(ytgt_data, yref_data, d);
|
|
// test inplace x
|
|
std::copy(x.begin(), x.end(), ytgt.begin());
|
|
tgt(ytgt_data, ytgt_data, d);
|
|
ExpectEQ<T>(ytgt_data, yref_data, d);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::LSTMTuples<T>, std::vector<T>, std::vector<T>,
|
|
std::vector<T>, std::vector<T>, std::vector<T>,
|
|
typename jit::LSTMTuples<T>::attr_type> {
|
|
void operator()(const typename jit::LSTMTuples<T>::func_type tgt,
|
|
const std::vector<T>& xsrc, const std::vector<T>& wp,
|
|
const std::vector<T>& ct_1, const std::vector<T>& ct_ref,
|
|
const std::vector<T>& ht_ref,
|
|
const typename jit::LSTMTuples<T>::attr_type& attr) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(ct_ref.size(), ht_ref.size());
|
|
EXPECT_EQ(ct_1.size(), ht_ref.size());
|
|
EXPECT_EQ(xsrc.size(), 4 * ht_ref.size());
|
|
EXPECT_EQ(wp.size(), 3 * ht_ref.size());
|
|
|
|
// x could be changed after compute, so copy to save src
|
|
int d = ht_ref.size();
|
|
std::vector<T> x(xsrc.size()), ct(ct_ref.size()), ht(ht_ref.size());
|
|
std::vector<T> checked(2 * d);
|
|
std::copy(xsrc.begin(), xsrc.end(), x.begin());
|
|
|
|
const T* ct_1_data = ct_1.data();
|
|
const T* wp_data = wp.data();
|
|
const T* ct_ref_data = ct_ref.data();
|
|
const T* ht_ref_data = ht_ref.data();
|
|
T* x_data = x.data();
|
|
T* ct_data = ct.data();
|
|
T* ht_data = ht.data();
|
|
T* checked_data = checked.data();
|
|
|
|
jit::lstm_t step;
|
|
step.gates = x_data;
|
|
step.ct_1 = ct_1_data;
|
|
step.ct = ct_data;
|
|
step.ht = ht_data;
|
|
if (attr.use_peephole) {
|
|
step.wp = wp_data;
|
|
step.checked = checked_data;
|
|
}
|
|
|
|
tgt(&step, &attr);
|
|
ExpectEQ<T>(ct_data, ct_ref_data, d);
|
|
ExpectEQ<T>(ht_data, ht_ref_data, d);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::GRUTuples<T>, std::vector<T>, std::vector<T>,
|
|
std::vector<T>,
|
|
typename jit::GRUTuples<T>::attr_type> {
|
|
void operator()(const typename jit::GRUTuples<T>::func_type tgt,
|
|
const std::vector<T>& xsrc, const std::vector<T>& ht_1,
|
|
const std::vector<T>& ht_ref,
|
|
const typename jit::GRUTuples<T>::attr_type& attr) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(ht_1.size(), ht_ref.size());
|
|
EXPECT_EQ(xsrc.size(), 3 * ht_ref.size());
|
|
|
|
// x could be changed after compute, so copy to save src
|
|
int d = ht_ref.size();
|
|
std::vector<T> x(xsrc.size()), ht(ht_ref.size());
|
|
std::copy(xsrc.begin(), xsrc.end(), x.begin());
|
|
const T* ht_1_data = ht_1.data();
|
|
const T* ht_ref_data = ht_ref.data();
|
|
T* x_data = x.data();
|
|
T* ht_data = ht.data();
|
|
jit::gru_t step;
|
|
step.gates = x_data;
|
|
step.ht_1 = ht_1_data;
|
|
step.ht = ht_data;
|
|
tgt(&step, &attr);
|
|
ExpectEQ<T>(ht_data, ht_ref_data, d);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::SeqPoolTuples<T>, std::vector<T>, std::vector<T>,
|
|
typename jit::SeqPoolTuples<T>::attr_type> {
|
|
void operator()(const typename jit::SeqPoolTuples<T>::func_type tgt,
|
|
const std::vector<T>& x, const std::vector<T>& yref,
|
|
const typename jit::SeqPoolTuples<T>::attr_type& attr) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(x.size() % yref.size(), 0);
|
|
int w = yref.size();
|
|
std::vector<T> y(w);
|
|
const T* x_data = x.data();
|
|
const T* yref_data = yref.data();
|
|
T* y_data = y.data();
|
|
tgt(x_data, y_data, &attr);
|
|
ExpectEQ<T>(y_data, yref_data, w);
|
|
}
|
|
};
|
|
|
|
template <typename T>
|
|
struct TestFuncWithRefer<jit::MatMulTuples<T>, std::vector<T>, std::vector<T>,
|
|
std::vector<T>,
|
|
typename jit::MatMulTuples<T>::attr_type> {
|
|
void operator()(const typename jit::MatMulTuples<T>::func_type tgt,
|
|
const std::vector<T>& a, const std::vector<T>& b,
|
|
const std::vector<T>& cref,
|
|
const typename jit::MatMulTuples<T>::attr_type& attr) {
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
EXPECT_EQ(a.size(), static_cast<size_t>(attr.m * attr.k));
|
|
EXPECT_EQ(b.size(), static_cast<size_t>(attr.k * attr.n));
|
|
EXPECT_EQ(cref.size(), static_cast<size_t>(attr.m * attr.n));
|
|
std::vector<T> c(cref.size());
|
|
const T* a_data = a.data();
|
|
const T* b_data = b.data();
|
|
const T* cref_data = cref.data();
|
|
T* c_data = c.data();
|
|
tgt(a_data, b_data, c_data, &attr);
|
|
ExpectEQ<T>(c_data, cref_data, attr.m * attr.n);
|
|
}
|
|
};
|
|
|
|
template <jit::KernelType KT, typename KernelTuples, typename PlaceType,
|
|
typename... Args>
|
|
void TestAllImpls(const typename KernelTuples::attr_type& attr, Args... args) {
|
|
TestFuncWithRefer<KernelTuples, Args...> test;
|
|
// test jitcode
|
|
auto jitcode = jit::GetJitCode<KT, KernelTuples, PlaceType>(attr);
|
|
if (jitcode) {
|
|
VLOG(10) << "Test Jitcode Kernel ";
|
|
test(jitcode, args...);
|
|
}
|
|
// test all impls in more
|
|
jit::KernelKey kkey(KT, PlaceType());
|
|
auto& pool = jit::KernelPool().Instance().AllKernels();
|
|
auto iter = pool.find(kkey);
|
|
if (iter != pool.end()) {
|
|
auto& impls = iter->second;
|
|
for (auto& impl : impls) {
|
|
auto i = dynamic_cast<const jit::KernelMore<KernelTuples>*>(impl.get());
|
|
if (i && i->UseMe(attr)) {
|
|
auto more = i->GetFunc();
|
|
VLOG(10) << "Test More Kernel : " << i->ImplType();
|
|
test(more, args...);
|
|
}
|
|
}
|
|
}
|
|
// test result from Get function
|
|
// VLOG(10) << "Test Get function ";
|
|
auto tgt = jit::Get<KT, KernelTuples, PlaceType>(attr);
|
|
test(tgt, args...);
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestXYZNKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
for (int d : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::XYZNTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
|
|
std::vector<T> x(d), y(d), zref(d);
|
|
RandomVec<T>(d, x.data());
|
|
RandomVec<T>(d, y.data());
|
|
|
|
std::vector<T> xinp(d), yinp(d); // inplace test
|
|
std::copy(x.begin(), x.end(), xinp.begin());
|
|
std::copy(y.begin(), y.end(), yinp.begin());
|
|
|
|
const T* x_data = x.data();
|
|
const T* y_data = y.data();
|
|
T* zref_data = zref.data();
|
|
T* xinp_data = xinp.data();
|
|
T* yinp_data = yinp.data();
|
|
|
|
// test refer code inplace
|
|
ref(x_data, y_data, zref_data, d);
|
|
ref(x_data, yinp_data, yinp_data, d);
|
|
ref(xinp_data, y_data, xinp_data, d);
|
|
ExpectEQ<T>(xinp_data, zref_data, d);
|
|
ExpectEQ<T>(yinp_data, zref_data, d);
|
|
|
|
TestAllImpls<KT, jit::XYZNTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>, std::vector<T>>(d, x, y, zref);
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestAXYNKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
for (int d : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::AXYNTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
|
|
const T a = static_cast<T>(3);
|
|
std::vector<T> x(d), yref(d);
|
|
std::vector<T> xinp(d); // inplace test
|
|
RandomVec<T>(d, x.data());
|
|
std::copy(x.begin(), x.end(), xinp.begin());
|
|
|
|
const T* x_data = x.data();
|
|
T* yref_data = yref.data();
|
|
T* xinp_data = xinp.data();
|
|
// test refer code inplace
|
|
ref(&a, x_data, yref_data, d);
|
|
ref(&a, xinp_data, xinp_data, d);
|
|
ExpectEQ<T>(xinp_data, yref_data, d);
|
|
|
|
TestAllImpls<KT, jit::AXYNTuples<T>, PlaceType, T, std::vector<T>,
|
|
std::vector<T>>(d, a, x, yref);
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestXRNKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
auto last_acc = FLAGS_acc;
|
|
FLAGS_acc = 1e-4;
|
|
for (int d : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::XRNTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> x(d);
|
|
RandomVec<T>(d, x.data(), -2.f, 2.f);
|
|
T ref_res;
|
|
ref(x.data(), &ref_res, d);
|
|
TestAllImpls<KT, jit::XRNTuples<T>, PlaceType, std::vector<T>, T>(d, x,
|
|
ref_res);
|
|
}
|
|
FLAGS_acc = last_acc;
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestXYNKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
for (int d : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::XYNTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
|
|
std::vector<T> x(d), yref(d);
|
|
std::vector<T> xinp(d); // inplace test
|
|
RandomVec<T>(d, x.data(), -2.f, 2.f);
|
|
std::copy(x.begin(), x.end(), xinp.begin());
|
|
|
|
const T* x_data = x.data();
|
|
T* yref_data = yref.data();
|
|
T* xinp_data = xinp.data();
|
|
// test refer code inplace
|
|
ref(x_data, yref_data, d);
|
|
ref(xinp_data, xinp_data, d);
|
|
ExpectEQ<T>(xinp_data, yref_data, d);
|
|
|
|
TestAllImpls<KT, jit::XYNTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>>(d, x, yref);
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestLSTMKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
std::vector<std::string> all_acts = {"sigmoid", "tanh", "relu", "identity"};
|
|
for (int d : TestSizes()) {
|
|
for (bool use_peephole : {true, false}) {
|
|
for (auto& act_gate : all_acts) {
|
|
for (auto& act_cand : all_acts) {
|
|
for (auto& act_cell : all_acts) {
|
|
const jit::lstm_attr_t attr(
|
|
d, jit::to_kerneltype(act_gate), jit::to_kerneltype(act_cand),
|
|
jit::to_kerneltype(act_cell), use_peephole);
|
|
auto ref = jit::GetRefer<KT, jit::LSTMTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> xsrc(4 * d), wp(3 * d), ct_1(d);
|
|
std::vector<T> ct_ref(d), ht_ref(d), checked(2 * d);
|
|
RandomVec<T>(4 * d, xsrc.data(), -2.f, 2.f);
|
|
RandomVec<T>(3 * d, wp.data(), -1.f, 1.f);
|
|
RandomVec<T>(d, ct_1.data(), -1.f, 1.f);
|
|
// x could be changed after compute, so copy to save src
|
|
std::vector<T> x(xsrc.size());
|
|
std::copy(xsrc.begin(), xsrc.end(), x.begin());
|
|
const T* ct_1_data = ct_1.data();
|
|
const T* wp_data = wp.data();
|
|
T* x_data = x.data();
|
|
T* checked_data = checked.data();
|
|
T* ct_ref_data = ct_ref.data();
|
|
T* ht_ref_data = ht_ref.data();
|
|
jit::lstm_t step;
|
|
step.gates = x_data;
|
|
step.ct_1 = ct_1_data;
|
|
step.ct = ct_ref_data;
|
|
step.ht = ht_ref_data;
|
|
if (use_peephole) {
|
|
step.wp = wp_data;
|
|
step.checked = checked_data;
|
|
}
|
|
ref(&step, &attr);
|
|
VLOG(10) << attr;
|
|
TestAllImpls<KT, jit::LSTMTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>, std::vector<T>, std::vector<T>,
|
|
std::vector<T>>(attr, xsrc, wp, ct_1, ct_ref, ht_ref,
|
|
attr);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestGRUKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
std::vector<std::string> all_acts = {"sigmoid", "tanh", "relu", "identity"};
|
|
for (int d : TestSizes()) {
|
|
for (auto& act_gate : all_acts) {
|
|
for (auto& act_cand : all_acts) {
|
|
const jit::gru_attr_t attr(d, jit::to_kerneltype(act_gate),
|
|
jit::to_kerneltype(act_cand));
|
|
auto ref = jit::GetRefer<KT, jit::GRUTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> xsrc(3 * d), ht_1(d), ht_ref(d);
|
|
RandomVec<T>(3 * d, xsrc.data(), -2.f, 2.f);
|
|
RandomVec<T>(d, ht_1.data(), -2.f, 2.f);
|
|
// x could be changed after compute, so copy to save src
|
|
std::vector<T> x(xsrc.size());
|
|
std::copy(xsrc.begin(), xsrc.end(), x.begin());
|
|
const T* ht_1_data = ht_1.data();
|
|
T* x_data = x.data();
|
|
T* ht_ref_data = ht_ref.data();
|
|
jit::gru_t step;
|
|
step.gates = x_data;
|
|
step.ht_1 = ht_1_data;
|
|
step.ht = ht_ref_data;
|
|
ref(&step, &attr);
|
|
VLOG(10) << attr;
|
|
TestAllImpls<KT, jit::GRUTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>, std::vector<T>>(attr, xsrc, ht_1, ht_ref,
|
|
attr);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestSeqPoolKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
std::vector<jit::SeqPoolType> pool_types = {
|
|
jit::SeqPoolType::kSum, jit::SeqPoolType::kAvg, jit::SeqPoolType::kSqrt};
|
|
for (auto type : pool_types) {
|
|
for (int w : TestSizes()) {
|
|
jit::seq_pool_attr_t attr(w, type);
|
|
for (int h : TestSizes()) {
|
|
attr.h = h;
|
|
auto ref = jit::GetRefer<KT, jit::SeqPoolTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> x(h * w), yref(w);
|
|
RandomVec<T>(h * w, x.data(), -2.f, 2.f);
|
|
const T* x_data = x.data();
|
|
T* yref_data = yref.data();
|
|
ref(x_data, yref_data, &attr);
|
|
VLOG(10) << attr;
|
|
TestAllImpls<KT, jit::SeqPoolTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>>(attr, x, yref, attr);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestMatMulKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
auto last_acc = FLAGS_acc;
|
|
// TODO(intel): fix MKL acc issue
|
|
// https://github.com/PaddlePaddle/Paddle/issues/15447
|
|
FLAGS_acc = 1e-3;
|
|
for (int m : {1, 2, 3, 4}) {
|
|
for (int n : {1, 2, 3, 4}) {
|
|
for (int k : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::MatMulTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> a(m * k), b(k * n), c(m * n);
|
|
RandomVec<T>(m * k, a.data(), -2.f, 2.f);
|
|
RandomVec<T>(k * n, b.data(), -2.f, 2.f);
|
|
const T* a_data = a.data();
|
|
const T* b_data = b.data();
|
|
T* c_data = c.data();
|
|
const jit::matmul_attr_t attr{m, n, k};
|
|
ref(a_data, b_data, c_data, &attr);
|
|
TestAllImpls<KT, jit::MatMulTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>, std::vector<T>>(attr, a, b, c, attr);
|
|
}
|
|
}
|
|
}
|
|
FLAGS_acc = last_acc;
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestSoftmaxKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
for (int bs : {1, 2, 10}) {
|
|
for (int n : TestSizes()) {
|
|
auto ref = jit::GetRefer<KT, jit::SoftmaxTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
std::vector<T> x(bs * n), y(bs * n);
|
|
RandomVec<T>(bs * n, x.data(), -2.f, 2.f);
|
|
const T* x_data = x.data();
|
|
T* y_data = y.data();
|
|
|
|
std::vector<T> xinp(x.size()); // inplace test
|
|
std::copy(x.begin(), x.end(), xinp.begin());
|
|
ref(x_data, y_data, n, bs);
|
|
T* xinp_data = xinp.data();
|
|
ref(xinp_data, xinp_data, n, bs);
|
|
ExpectEQ<T>(xinp_data, y_data, n * bs);
|
|
|
|
TestAllImpls<KT, jit::SoftmaxTuples<T>, PlaceType, std::vector<T>,
|
|
std::vector<T>>(n, x, y, n, bs);
|
|
}
|
|
}
|
|
}
|
|
|
|
template <jit::KernelType KT, typename T, typename PlaceType>
|
|
void TestNCHW16CMulNCKernel() {
|
|
VLOG(10) << "===== Test JITKernel " << jit::to_string(KT);
|
|
const int n = 3, c = 16 * 4, h = 10, w = 10;
|
|
auto ref = jit::GetRefer<KT, jit::NCHW16CMulNCTuples<T>>();
|
|
EXPECT_TRUE(ref != nullptr);
|
|
int sz = n * c * h * w;
|
|
std::vector<T> x(sz), y(n * c), zref(sz);
|
|
std::vector<T> ztgt(sz), zjit(sz);
|
|
RandomVec<T>(sz, x.data(), -2.f, 2.f);
|
|
RandomVec<T>(n * c, y.data(), -2.f, 2.f);
|
|
|
|
const T* x_data = x.data();
|
|
const T* y_data = y.data();
|
|
T* zref_data = zref.data();
|
|
T* ztgt_data = ztgt.data();
|
|
T* zjit_data = zjit.data();
|
|
constexpr int simd_width = ZMM_FLOAT_BLOCK;
|
|
int C = c / simd_width;
|
|
auto tgt = jit::Get<KT, jit::NCHW16CMulNCTuples<T>, PlaceType>(0);
|
|
auto jitcode = jit::GetJitCode<KT, jit::NCHW16CMulNCTuples<T>, PlaceType>(0);
|
|
EXPECT_TRUE(tgt != nullptr);
|
|
|
|
if (std::is_same<T, float>::value &&
|
|
paddle::platform::MayIUse(paddle::platform::avx512f)) {
|
|
EXPECT_TRUE(jitcode != nullptr);
|
|
}
|
|
for (int ni = 0; ni < n; ni++) {
|
|
for (int ci = 0; ci < C; ci++) {
|
|
auto ptr_x =
|
|
x_data + ni * C * h * w * simd_width + ci * h * w * simd_width;
|
|
auto ptr_y = y_data + ni * C * simd_width + ci * simd_width;
|
|
auto ptr_zref =
|
|
zref_data + ni * C * h * w * simd_width + ci * h * w * simd_width;
|
|
auto ptr_ztgt =
|
|
ztgt_data + ni * C * h * w * simd_width + ci * h * w * simd_width;
|
|
|
|
ref(ptr_x, ptr_y, ptr_zref, h, w);
|
|
tgt(ptr_x, ptr_y, ptr_ztgt, h, w);
|
|
|
|
if (jitcode) {
|
|
auto ptr_zjit =
|
|
zjit_data + ni * C * h * w * simd_width + ci * h * w * simd_width;
|
|
jitcode(ptr_x, ptr_y, ptr_zjit, h, w);
|
|
}
|
|
}
|
|
}
|
|
ExpectEQ<T>(ztgt_data, zref_data, sz);
|
|
if (jitcode) {
|
|
ExpectEQ<T>(zjit_data, zref_data, sz);
|
|
}
|
|
}
|
|
|
|
// XYZNTuple
|
|
TEST(JITKernel, kVMul) {
|
|
TestXYZNKernel<jit::kVMul, float, CPUPlace>();
|
|
TestXYZNKernel<jit::kVMul, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVAdd) {
|
|
TestXYZNKernel<jit::kVAdd, float, CPUPlace>();
|
|
TestXYZNKernel<jit::kVAdd, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVAddRelu) {
|
|
TestXYZNKernel<jit::kVAddRelu, float, CPUPlace>();
|
|
TestXYZNKernel<jit::kVAddRelu, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVSub) {
|
|
TestXYZNKernel<jit::kVSub, float, CPUPlace>();
|
|
TestXYZNKernel<jit::kVSub, double, CPUPlace>();
|
|
}
|
|
|
|
// AXYNTuples
|
|
TEST(JITKernel, kVScal) {
|
|
TestAXYNKernel<jit::kVScal, float, CPUPlace>();
|
|
TestAXYNKernel<jit::kVScal, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVAddBias) {
|
|
TestAXYNKernel<jit::kVAddBias, float, CPUPlace>();
|
|
TestAXYNKernel<jit::kVAddBias, double, CPUPlace>();
|
|
}
|
|
|
|
// XRNTuples
|
|
TEST(JITKernel, kHMax) {
|
|
TestXRNKernel<jit::kHMax, float, CPUPlace>();
|
|
TestXRNKernel<jit::kHMax, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kHSum) {
|
|
TestXRNKernel<jit::kHSum, float, CPUPlace>();
|
|
TestXRNKernel<jit::kHSum, double, CPUPlace>();
|
|
}
|
|
|
|
// XYNTuples
|
|
TEST(JITKernel, kVRelu) {
|
|
TestXYNKernel<jit::kVRelu, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVRelu, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVIdentity) {
|
|
TestXYNKernel<jit::kVIdentity, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVIdentity, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVSquare) {
|
|
TestXYNKernel<jit::kVSquare, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVSquare, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVExp) {
|
|
TestXYNKernel<jit::kVExp, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVExp, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVSigmoid) {
|
|
TestXYNKernel<jit::kVSigmoid, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVSigmoid, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kVTanh) {
|
|
TestXYNKernel<jit::kVTanh, float, CPUPlace>();
|
|
TestXYNKernel<jit::kVTanh, double, CPUPlace>();
|
|
}
|
|
|
|
// LSTM
|
|
TEST(JITKernel, kLSTMCtHt) {
|
|
TestLSTMKernel<jit::kLSTMCtHt, float, CPUPlace>();
|
|
TestLSTMKernel<jit::kLSTMCtHt, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kLSTMC1H1) {
|
|
TestLSTMKernel<jit::kLSTMC1H1, float, CPUPlace>();
|
|
TestLSTMKernel<jit::kLSTMC1H1, double, CPUPlace>();
|
|
}
|
|
|
|
// GRU
|
|
TEST(JITKernel, kGRUH1) {
|
|
TestGRUKernel<jit::kGRUH1, float, CPUPlace>();
|
|
TestGRUKernel<jit::kGRUH1, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kGRUHtPart1) {
|
|
TestGRUKernel<jit::kGRUHtPart1, float, CPUPlace>();
|
|
TestGRUKernel<jit::kGRUHtPart1, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kGRUHtPart2) {
|
|
TestGRUKernel<jit::kGRUHtPart2, float, CPUPlace>();
|
|
TestGRUKernel<jit::kGRUHtPart2, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kSeqPool) {
|
|
TestSeqPoolKernel<jit::kSeqPool, float, CPUPlace>();
|
|
TestSeqPoolKernel<jit::kSeqPool, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kMatMul) {
|
|
TestMatMulKernel<jit::kMatMul, float, CPUPlace>();
|
|
TestMatMulKernel<jit::kMatMul, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kSoftmax) {
|
|
TestSoftmaxKernel<jit::kSoftmax, float, CPUPlace>();
|
|
TestSoftmaxKernel<jit::kSoftmax, double, CPUPlace>();
|
|
}
|
|
|
|
TEST(JITKernel, kNCHW16CMulNC) {
|
|
TestNCHW16CMulNCKernel<jit::kNCHW16CMulNC, float, CPUPlace>();
|
|
TestNCHW16CMulNCKernel<jit::kNCHW16CMulNC, double, CPUPlace>();
|
|
}
|
|
|
|
// TODO(yihua/TJ): add crf decoding and layer norm unit tests
|
|
|
|
TEST(JITKernel, pool) {
|
|
// TODO(TJ): add some test
|
|
}
|