|
|
|
@ -13,7 +13,7 @@
|
|
|
|
|
* limitations under the License. */
|
|
|
|
|
|
|
|
|
|
#include "paddle/fluid/operators/jit/kernel_key.h"
|
|
|
|
|
#include <xxhash.h>
|
|
|
|
|
#include <xxhash.h> // XXH64: 13.8 GB/s
|
|
|
|
|
#include "paddle/fluid/platform/enforce.h"
|
|
|
|
|
|
|
|
|
|
namespace paddle {
|
|
|
|
@ -21,73 +21,46 @@ namespace operators {
|
|
|
|
|
namespace jit {
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<int>(const int& d) {
|
|
|
|
|
int64_t JitCodeKey<int>(const int& d) {
|
|
|
|
|
return d;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<int64_t>(const int64_t& d) {
|
|
|
|
|
int64_t JitCodeKey<int64_t>(const int64_t& d) {
|
|
|
|
|
return d;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// TODO(TJ): refine and benchmark JitCodeKey generatation
|
|
|
|
|
constexpr int act_type_shift = 3; // suppot 2^3 act types
|
|
|
|
|
static inline int act_type_convert(KernelType type) {
|
|
|
|
|
if (type == kVIdentity) {
|
|
|
|
|
return 0;
|
|
|
|
|
} else if (type == kVExp) {
|
|
|
|
|
return 1;
|
|
|
|
|
} else if (type == kVRelu) {
|
|
|
|
|
return 2;
|
|
|
|
|
} else if (type == kVSigmoid) {
|
|
|
|
|
return 3;
|
|
|
|
|
} else if (type == kVTanh) {
|
|
|
|
|
return 4;
|
|
|
|
|
}
|
|
|
|
|
PADDLE_THROW("Unsupported act type %d", type);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<lstm_attr_t>(const lstm_attr_t& attr) {
|
|
|
|
|
// XXH64: 13.8 GB/s
|
|
|
|
|
|
|
|
|
|
size_t key = attr.d;
|
|
|
|
|
int gate_key = act_type_convert(attr.act_gate) << 1;
|
|
|
|
|
int cand_key = act_type_convert(attr.act_cand) << (1 + act_type_shift);
|
|
|
|
|
int cell_key = act_type_convert(attr.act_cell) << (1 + act_type_shift * 2);
|
|
|
|
|
return (key << (1 + act_type_shift * 3)) + gate_key + cand_key + cell_key +
|
|
|
|
|
attr.use_peephole;
|
|
|
|
|
int64_t JitCodeKey<gru_attr_t>(const gru_attr_t& attr) {
|
|
|
|
|
return XXH64(&attr, sizeof(gru_attr_t), 0);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<gru_attr_t>(const gru_attr_t& attr) {
|
|
|
|
|
size_t key = attr.d;
|
|
|
|
|
return (key << (act_type_shift * 2)) + act_type_convert(attr.act_gate) +
|
|
|
|
|
(act_type_convert(attr.act_cand) << act_type_shift);
|
|
|
|
|
int64_t JitCodeKey<lstm_attr_t>(const lstm_attr_t& attr) {
|
|
|
|
|
int keys[5] = {
|
|
|
|
|
attr.d, static_cast<int>(attr.act_gate), static_cast<int>(attr.act_cand),
|
|
|
|
|
static_cast<int>(attr.act_cell), static_cast<int>(attr.use_peephole)};
|
|
|
|
|
return XXH64(keys, sizeof(int) * 5, 0);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<seq_pool_attr_t>(const seq_pool_attr_t& attr) {
|
|
|
|
|
size_t key = attr.w;
|
|
|
|
|
constexpr int pool_type_shift = 3;
|
|
|
|
|
return (key << pool_type_shift) + static_cast<int>(attr.type);
|
|
|
|
|
int64_t JitCodeKey<seq_pool_attr_t>(const seq_pool_attr_t& attr) {
|
|
|
|
|
int keys[2] = {attr.w, static_cast<int>(attr.type)};
|
|
|
|
|
return XXH64(keys, sizeof(int) * 2, 0);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<matmul_attr_t>(const matmul_attr_t& attr) {
|
|
|
|
|
size_t key = attr.m;
|
|
|
|
|
constexpr int shift = 21;
|
|
|
|
|
return (key << shift * 2) + ((static_cast<size_t>(attr.n)) << shift) + attr.k;
|
|
|
|
|
int64_t JitCodeKey<matmul_attr_t>(const matmul_attr_t& attr) {
|
|
|
|
|
return XXH64(&attr, sizeof(int) * 3, 0); // m, n, k
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<emb_seq_pool_attr_t>(const emb_seq_pool_attr_t& attr) {
|
|
|
|
|
int64_t JitCodeKey<emb_seq_pool_attr_t>(const emb_seq_pool_attr_t& attr) {
|
|
|
|
|
return attr.table_width;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
|
size_t JitCodeKey<sgd_attr_t>(const sgd_attr_t& attr) {
|
|
|
|
|
int64_t JitCodeKey<sgd_attr_t>(const sgd_attr_t& attr) {
|
|
|
|
|
return attr.grad_width;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|