Automated g4 rollback of changelist 179782067

PiperOrigin-RevId: 179861781
author: A. Unique TensorFlower <gardener@tensorflow.org> 2017-12-21 14:50:09 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2017-12-21 14:54:21 -0800
commit: e21952f86328d16d1a8a4ac5e100917a251d093f (patch)
tree: 1d9274230d915810cd78563f9952ee7ecf006408 /tensorflow/core/util/cuda_kernel_helper_test.cu.cc
parent: 7989a3aa026f93c1f45e1baf4ac37ad2a79156f9 (diff)
1 files changed, 6 insertions, 54 deletions
diff --git a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
index bd4c356ea0..6991554eff 100644
--- a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
+++ b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
@@ -52,11 +52,11 @@ __global__ void Count1D(CudaLaunchConfig config, int bufsize, int* outbuf) {
   }
 }
 __global__ void Count2D(Cuda2DLaunchConfig config, int bufsize, int* outbuf) {
-  CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) {
+  CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count, x) {
     if (x < 0) {  // x might overflow when testing extreme case
       break;
     }
-    CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) {
+    CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count, y) {
       if (y < 0) {  // y might overflow when testing extreme case
         break;
       }
@@ -66,15 +66,15 @@ __global__ void Count2D(Cuda2DLaunchConfig config, int bufsize, int* outbuf) {
   }
 }
 __global__ void Count3D(Cuda3DLaunchConfig config, int bufsize, int* outbuf) {
-  CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) {
+  CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count, x) {
     if (x < 0) {  // x might overflow when testing extreme case
       break;
     }
-    CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) {
+    CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count, y) {
       if (y < 0) {  // y might overflow when testing extreme case
         break;
       }
-      CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count.z, Z) {
+      CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count, z) {
         if (z < 0) {  // z might overflow when testing extreme case
           break;
         }
@@ -87,44 +87,6 @@ __global__ void Count3D(Cuda3DLaunchConfig config, int bufsize, int* outbuf) {
   }
 }
 
-__global__ void CudaShuffleGetSrcLaneTest(unsigned* failure_count) {
-  unsigned lane_id = CudaLaneId();
-  for (int width = warpSize; width > 1; width /= 2) {
-    auto check_result = [&](const char* op_name, int param, unsigned actual,
-                            unsigned expected) {
-      if (actual != expected) {
-        printf("Cuda%sGetSrcLane(%d, %d) for lane %d returned %d, not %d\n",
-               op_name, param, width, lane_id, actual, expected);
-        CudaAtomicAdd(failure_count, 1);
-      }
-    };
-    for (int src_lane = -warpSize; src_lane <= warpSize; ++src_lane) {
-      unsigned actual_lane = detail::CudaShuffleGetSrcLane(src_lane, width);
-      unsigned expect_lane =
-          CudaShuffleSync(kCudaWarpAll, lane_id, src_lane, width);
-      check_result("Shuffle", src_lane, actual_lane, expect_lane);
-    }
-    for (unsigned delta = 0; delta <= warpSize; ++delta) {
-      unsigned actual_lane = detail::CudaShuffleUpGetSrcLane(delta, width);
-      unsigned expect_lane =
-          CudaShuffleUpSync(kCudaWarpAll, lane_id, delta, width);
-      check_result("ShuffleUp", delta, actual_lane, expect_lane);
-    }
-    for (unsigned delta = 0; delta <= warpSize; ++delta) {
-      unsigned actual_lane = detail::CudaShuffleDownGetSrcLane(delta, width);
-      unsigned expect_lane =
-          CudaShuffleDownSync(kCudaWarpAll, lane_id, delta, width);
-      check_result("ShuffleDown", delta, actual_lane, expect_lane);
-    }
-    for (int lane_lane = warpSize; lane_lane > 0; lane_lane /= 2) {
-      unsigned actual_lane = detail::CudaShuffleXorGetSrcLane(lane_lane, width);
-      unsigned expect_lane =
-          CudaShuffleXorSync(kCudaWarpAll, lane_id, lane_lane, width);
-      check_result("ShuffleXor", lane_lane, actual_lane, expect_lane);
-    }
-  }
-}
-
 }  // namespace
 
 class CudaLaunchConfigTest : public ::testing::Test {
@@ -132,7 +94,7 @@ class CudaLaunchConfigTest : public ::testing::Test {
   const int bufsize = 1024;
   int* outbuf = nullptr;
   Eigen::CudaStreamDevice stream;
-  Eigen::GpuDevice d = Eigen::GpuDevice(&stream);
+  GPUDevice d = GPUDevice(&stream);
 
   virtual void SetUp() {
     cudaError_t err = cudaMallocManaged(&outbuf, sizeof(int) * bufsize);
@@ -267,16 +229,6 @@ TEST_F(CudaLaunchConfigTest, GetCuda3DLaunchConfig) {
   #undef TEST_LAUNCH_PARAMETER
 }
 
-TEST(CudaDeviceFunctionsTest, ShuffleGetSrcLane) {
-  unsigned* failure_count;
-  ASSERT_EQ(cudaMallocManaged(&failure_count, sizeof(unsigned)), cudaSuccess);
-  *failure_count = 0;
-  CudaShuffleGetSrcLaneTest<<<1, 32>>>(failure_count);
-  ASSERT_EQ(cudaDeviceSynchronize(), cudaSuccess);
-  ASSERT_EQ(*failure_count, 0);
-  cudaFree(failure_count);
-}
-
 }  // namespace tensorflow
 
 #endif  // GOOGLE_CUDA
author	A. Unique TensorFlower <gardener@tensorflow.org>	2017-12-21 14:50:09 -0800
committer	TensorFlower Gardener <gardener@tensorflow.org>	2017-12-21 14:54:21 -0800
commit	e21952f86328d16d1a8a4ac5e100917a251d093f (patch)
tree	1d9274230d915810cd78563f9952ee7ecf006408 /tensorflow/core/util/cuda_kernel_helper_test.cu.cc
parent	7989a3aa026f93c1f45e1baf4ac37ad2a79156f9 (diff)