fix atomicAdd -> CudaAtomicAdd

8 years ago · e21e5646a5
parent 6c6474cbd8
commit e21e5646a5
1 changed files with 4 additions and 8 deletions
--- a/paddle/operators/math/pooling.cu
+++ b/paddle/operators/math/pooling.cu
@ -144,7 +144,7 @@ __global__ void KernelMaxPool2DGrad(

    if (maxIndex != -1) {
      // atomic add
-      atomicAdd(input_grad + maxIndex, output_grad[index]);
+      platform::CudaAtomicAdd(input_grad + maxIndex, output_grad[index]);
    }
  }
 }
@ -278,9 +278,7 @@ class MaxPool2dGradFunctor<platform::GPUPlace, T> {
 };

 template class MaxPool2dGradFunctor<platform::GPUPlace, float>;
-// template class MaxPool2dGradFunctor<platform::GPUPlace, double>; // The
-// 64-bit floating-point version of atomicAdd() is only supported by devices of
-// compute capability 6.x and higher.
+template class MaxPool2dGradFunctor<platform::GPUPlace, double>;

 template class Pool2dFunctor<platform::GPUPlace,
                             paddle::operators::math::MaxPool<float>, float>;
@ -453,7 +451,7 @@ __global__ void KernelMaxPool3DGrad(
    }
    if (maxIdx != -1) {
      // atomic add
-      atomicAdd(input_grad + maxIdx, output_grad[index]);
+      platform::CudaAtomicAdd(input_grad + maxIdx, output_grad[index]);
    }
  }
 }
@ -609,9 +607,7 @@ class MaxPool3dGradFunctor<platform::GPUPlace, T> {
 };

 template class MaxPool3dGradFunctor<platform::GPUPlace, float>;
-// template class MaxPool3dGradFunctor<platform::GPUPlace, double>;  // The
-// 64-bit floating-point version of atomicAdd() is only supported by devices of
-// compute capability 6.x and higher.
+template class MaxPool3dGradFunctor<platform::GPUPlace, double>;

 template class Pool3dFunctor<platform::GPUPlace,
                             paddle::operators::math::MaxPool<float>, float>;