|
|
|
@ -1,11 +1,8 @@
|
|
|
|
|
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
|
|
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
@ -17,31 +14,19 @@ limitations under the License. */
|
|
|
|
|
#include "paddle/fluid/platform/float16.h"
|
|
|
|
|
|
|
|
|
|
// Short alias for the operators namespace; the kernel and functor templates
// named in the registrations below are looked up through it.
namespace ops = paddle::operators;
|
|
|
|
|
// Short alias for the platform namespace; used below for CUDADeviceContext
// and float16.
namespace plat = paddle::platform;
|
|
|
|
|
|
|
|
|
|
// Registers the CUDA kernels of a single activation op.
//
//   act_type      op name; the backward op is registered as act_type##_grad.
//   functor       forward functor template, looked up in namespace ops.
//   grad_functor  backward functor template, looked up in namespace ops.
//
// The forward kernel is registered for float, double and plat::float16; the
// backward kernel is registered for float and double only.
//
// The expansion already ends in ';', so a trailing ';' at the call site is a
// harmless empty declaration.
#define REGISTER_ACTIVATION_CUDA_KERNEL(act_type, functor, grad_functor)      \
  REGISTER_OP_CUDA_KERNEL(                                                    \
      act_type,                                                               \
      ops::ActivationKernel<plat::CUDADeviceContext, ops::functor<float>>,    \
      ops::ActivationKernel<plat::CUDADeviceContext, ops::functor<double>>,   \
      ops::ActivationKernel<plat::CUDADeviceContext,                          \
                            ops::functor<plat::float16>>);                    \
  REGISTER_OP_CUDA_KERNEL(                                                    \
      act_type##_grad,                                                        \
      ops::ActivationGradKernel<plat::CUDADeviceContext,                      \
                                ops::grad_functor<float>>,                    \
      ops::ActivationGradKernel<plat::CUDADeviceContext,                      \
                                ops::grad_functor<double>>);
|
|
|
|
|
|
|
|
|
|
// Hands REGISTER_ACTIVATION_CUDA_KERNEL to FOR_EACH_KERNEL_FUNCTOR.
// NOTE(review): FOR_EACH_KERNEL_FUNCTOR is defined outside this view;
// presumably it invokes the macro once per (op name, functor, grad functor)
// triple — confirm against its definition.
FOR_EACH_KERNEL_FUNCTOR(REGISTER_ACTIVATION_CUDA_KERNEL);
|
|
|
|
|
|
|
|
|
|
// Explicit CUDA registration of the forward relu kernel for float, double and
// float16.
// NOTE(review): REGISTER_ACTIVATION_CUDA_KERNEL also registers a float16
// forward kernel. If relu is among the ops expanded through
// FOR_EACH_KERNEL_FUNCTOR, this statement registers relu a second time and
// should be removed — confirm before keeping it.
REGISTER_OP_CUDA_KERNEL(
    relu,
    ops::ActivationKernel<plat::CUDADeviceContext, ops::ReluFunctor<float>>,
    ops::ActivationKernel<plat::CUDADeviceContext, ops::ReluFunctor<double>>,
    ops::ActivationKernel<plat::CUDADeviceContext,
                          ops::ReluFunctor<plat::float16>>);
|
|
|
|
|
// Explicit CUDA registration of the backward relu kernel for float and double.
// NOTE(review): REGISTER_ACTIVATION_CUDA_KERNEL registers the same two
// backward types for act_type##_grad. If relu is among the ops expanded
// through FOR_EACH_KERNEL_FUNCTOR, this statement registers relu_grad a second
// time and should be removed — confirm before keeping it.
REGISTER_OP_CUDA_KERNEL(
    relu_grad,
    ops::ActivationGradKernel<plat::CUDADeviceContext,
                              ops::ReluGradFunctor<float>>,
    ops::ActivationGradKernel<plat::CUDADeviceContext,
                              ops::ReluGradFunctor<double>>);
|
|
|
|
|