From 083566732937f5f57a4bfcaa68c46da795f465ab Mon Sep 17 00:00:00 2001
From: Benoit Steiner
Date: Tue, 24 May 2016 23:11:56 -0700
Subject: There is no need to make the fp16 full reduction kernel a static function.

---
 unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h')

diff --git a/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h b/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h
index 63646dfc2..c0a36cd9c 100644
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorReductionCuda.h
@@ -159,7 +159,7 @@ __global__ void ReductionInitKernelHalfFloat(Reducer reducer, const Self input,
 template
-static __global__ void FullReductionKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs,
+__global__ void FullReductionKernelHalfFloat(Reducer reducer, const Self input, Index num_coeffs,
 half* output, half2* scratch) {
 eigen_assert(NumPerThread % 2 == 0);
--
cgit v1.2.3