aboutsummaryrefslogtreecommitdiffhomepage
path: root/unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h
diff options
context:
space:
mode:
authorGravatar Benoit Steiner <benoit.steiner.goog@gmail.com>2016-01-08 13:53:40 -0800
committerGravatar Benoit Steiner <benoit.steiner.goog@gmail.com>2016-01-08 13:53:40 -0800
commit53749ff4152191d2f1bd56090a14f6474fe059c2 (patch)
treedb47f940c3d31de9131dbc5a2c0019d6bf2b3bf7 /unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h
parent6639b7d6e86ef36f6f78cf51e36efa5a004154eb (diff)
Prevent nvcc from miscompiling the cuda metakernel. Unfortunately this reintroduces some compilation warnings, but it's much better than having to deal with random assertion failures.
Diffstat (limited to 'unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h')
-rw-r--r--unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h6
1 files changed, 1 insertions, 5 deletions
diff --git a/unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h b/unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h
index 4d7570077..af140a68b 100644
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorDeviceCuda.h
@@ -238,14 +238,10 @@ struct GpuDevice {
};
-#ifndef __CUDA_ARCH__
#define LAUNCH_CUDA_KERNEL(kernel, gridsize, blocksize, sharedmem, device, ...) \
(kernel) <<< (gridsize), (blocksize), (sharedmem), (device).stream() >>> (__VA_ARGS__); \
assert(cudaGetLastError() == cudaSuccess);
-#else
-#define LAUNCH_CUDA_KERNEL(...) \
- eigen_assert(false && "Cannot launch a kernel from another kernel");
-#endif
+
// FIXME: Should be device and kernel specific.
#ifdef __CUDACC__