about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
diff options
context:
space:
mode:
author: A. Unique TensorFlower <gardener@tensorflow.org> 2017-12-21 14:50:09 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2017-12-21 14:54:21 -0800
commit: e21952f86328d16d1a8a4ac5e100917a251d093f (patch)
tree: 1d9274230d915810cd78563f9952ee7ecf006408 /tensorflow/core/util/cuda_kernel_helper_test.cu.cc
parent: 7989a3aa026f93c1f45e1baf4ac37ad2a79156f9 (diff)
Automated g4 rollback of changelist 179782067
PiperOrigin-RevId: 179861781
Diffstat (limited to 'tensorflow/core/util/cuda_kernel_helper_test.cu.cc')
-rw-r--r-- tensorflow/core/util/cuda_kernel_helper_test.cu.cc 60
1 files changed, 6 insertions, 54 deletions
diff --git a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
index bd4c356ea0..6991554eff 100644
--- a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
+++ b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
@@ -52,11 +52,11 @@ __global__ void Count1D(CudaLaunchConfig config, int bufsize, int* outbuf) {
}
}
__global__ void Count2D(Cuda2DLaunchConfig config, int bufsize, int* outbuf) {
- CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) {
+ CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count, x) {
if (x < 0) { // x might overflow when testing extreme case
break;
}
- CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) {
+ CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count, y) {
if (y < 0) { // y might overflow when testing extreme case
break;
}
@@ -66,15 +66,15 @@ __global__ void Count2D(Cuda2DLaunchConfig config, int bufsize, int* outbuf) {
}
}
__global__ void Count3D(Cuda3DLaunchConfig config, int bufsize, int* outbuf) {
- CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) {
+ CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count, x) {
if (x < 0) { // x might overflow when testing extreme case
break;
}
- CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) {
+ CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count, y) {
if (y < 0) { // y might overflow when testing extreme case
break;
}
- CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count.z, Z) {
+ CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count, z) {
if (z < 0) { // z might overflow when testing extreme case
break;
}
@@ -87,44 +87,6 @@ __global__ void Count3D(Cuda3DLaunchConfig config, int bufsize, int* outbuf) {
}
}
-__global__ void CudaShuffleGetSrcLaneTest(unsigned* failure_count) {
- unsigned lane_id = CudaLaneId();
- for (int width = warpSize; width > 1; width /= 2) {
- auto check_result = [&](const char* op_name, int param, unsigned actual,
- unsigned expected) {
- if (actual != expected) {
- printf("Cuda%sGetSrcLane(%d, %d) for lane %d returned %d, not %d\n",
- op_name, param, width, lane_id, actual, expected);
- CudaAtomicAdd(failure_count, 1);
- }
- };
- for (int src_lane = -warpSize; src_lane <= warpSize; ++src_lane) {
- unsigned actual_lane = detail::CudaShuffleGetSrcLane(src_lane, width);
- unsigned expect_lane =
- CudaShuffleSync(kCudaWarpAll, lane_id, src_lane, width);
- check_result("Shuffle", src_lane, actual_lane, expect_lane);
- }
- for (unsigned delta = 0; delta <= warpSize; ++delta) {
- unsigned actual_lane = detail::CudaShuffleUpGetSrcLane(delta, width);
- unsigned expect_lane =
- CudaShuffleUpSync(kCudaWarpAll, lane_id, delta, width);
- check_result("ShuffleUp", delta, actual_lane, expect_lane);
- }
- for (unsigned delta = 0; delta <= warpSize; ++delta) {
- unsigned actual_lane = detail::CudaShuffleDownGetSrcLane(delta, width);
- unsigned expect_lane =
- CudaShuffleDownSync(kCudaWarpAll, lane_id, delta, width);
- check_result("ShuffleDown", delta, actual_lane, expect_lane);
- }
- for (int lane_lane = warpSize; lane_lane > 0; lane_lane /= 2) {
- unsigned actual_lane = detail::CudaShuffleXorGetSrcLane(lane_lane, width);
- unsigned expect_lane =
- CudaShuffleXorSync(kCudaWarpAll, lane_id, lane_lane, width);
- check_result("ShuffleXor", lane_lane, actual_lane, expect_lane);
- }
- }
-}
-
} // namespace
class CudaLaunchConfigTest : public ::testing::Test {
@@ -132,7 +94,7 @@ class CudaLaunchConfigTest : public ::testing::Test {
const int bufsize = 1024;
int* outbuf = nullptr;
Eigen::CudaStreamDevice stream;
- Eigen::GpuDevice d = Eigen::GpuDevice(&stream);
+ GPUDevice d = GPUDevice(&stream);
virtual void SetUp() {
cudaError_t err = cudaMallocManaged(&outbuf, sizeof(int) * bufsize);
@@ -267,16 +229,6 @@ TEST_F(CudaLaunchConfigTest, GetCuda3DLaunchConfig) {
#undef TEST_LAUNCH_PARAMETER
}
-TEST(CudaDeviceFunctionsTest, ShuffleGetSrcLane) {
- unsigned* failure_count;
- ASSERT_EQ(cudaMallocManaged(&failure_count, sizeof(unsigned)), cudaSuccess);
- *failure_count = 0;
- CudaShuffleGetSrcLaneTest<<<1, 32>>>(failure_count);
- ASSERT_EQ(cudaDeviceSynchronize(), cudaSuccess);
- ASSERT_EQ(*failure_count, 0);
- cudaFree(failure_count);
-}
-
} // namespace tensorflow
#endif // GOOGLE_CUDA