From 841e075154c1b423595b54bca3569855b1652cc0 Mon Sep 17 00:00:00 2001 From: Igor Babuschkin Date: Sat, 6 Aug 2016 18:07:50 +0100 Subject: Remove CUDA >= 300 checks and enable outer reduction for doubles --- .../Eigen/CXX11/src/Tensor/TensorReductionCuda.h | 45 +++++----------------- 1 file changed, 9 insertions(+), 36 deletions(-) (limited to 'unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h') diff --git a/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h b/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h index c3bdc2783..af5c71247 100644 --- a/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h +++ b/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h @@ -23,7 +23,6 @@ namespace internal { // updated the content of the output address it will try again. template __device__ EIGEN_ALWAYS_INLINE void atomicReduce(T* output, T accum, R& reducer) { -#if __CUDA_ARCH__ >= 300 if (sizeof(T) == 4) { unsigned int oldval = *reinterpret_cast(output); @@ -62,9 +61,6 @@ __device__ EIGEN_ALWAYS_INLINE void atomicReduce(T* output, T accum, R& reducer) else { assert(0 && "Wordsize not supported"); } -#else - assert(0 && "Shouldn't be called on unsupported device"); -#endif } // We extend atomicExch to support extra data types @@ -82,7 +78,6 @@ __device__ inline double atomicExchCustom(double* address, double val) { #ifdef EIGEN_HAS_CUDA_FP16 template