about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
diff options
context:
space:
mode:
author: A. Unique TensorFlower <gardener@tensorflow.org> 2018-01-30 10:05:04 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2018-01-30 12:27:47 -0800
commit: 7149a2e2e2f549035f23e21224ee41afe8df3876 (patch)
tree: 4fab32a87362e9708d07f388154a10ccb0c7800b /tensorflow/core/util/cuda_kernel_helper_test.cu.cc
parent: 88eb6c61ef7659c2b5bb1ec6586c7d3cca5e4e9c (diff)
Cleanup: Ran clang-format on files in tensorflow/core/.../*.{cc,h}.
PiperOrigin-RevId: 183848459
Diffstat (limited to 'tensorflow/core/util/cuda_kernel_helper_test.cu.cc')
-rw-r--r-- tensorflow/core/util/cuda_kernel_helper_test.cu.cc | 112
1 files changed, 56 insertions, 56 deletions
diff --git a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
index bd4c356ea0..732ed33ede 100644
--- a/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
+++ b/tensorflow/core/util/cuda_kernel_helper_test.cu.cc
@@ -149,27 +149,27 @@ class CudaLaunchConfigTest : public ::testing::Test {
TEST_F(CudaLaunchConfigTest, GetCudaLaunchConfig) {
CudaLaunchConfig cfg;
- // test valid inputs
- #define TEST_LAUNCH_PARAMETER(work_element_count) \
- cfg = GetCudaLaunchConfig(bufsize, d); \
- SetOutbufZero<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> \
- (cfg, outbuf); \
- CUDA_ASSERT_SUCCESS \
- cfg = GetCudaLaunchConfig(work_element_count, d); \
- Count1D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> ( \
- cfg, bufsize, outbuf); \
- CUDA_EXPECT_SUCCESS \
- EXPECT_EQ(work_element_count, std::accumulate(outbuf, outbuf + bufsize, 0));\
- \
- cfg = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
- SetOutbufZero<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> \
- (cfg, outbuf); \
- CUDA_ASSERT_SUCCESS \
- cfg = GetCudaLaunchConfig(work_element_count, d, Count1D, 0, 0); \
- Count1D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> ( \
- cfg, bufsize, outbuf); \
- CUDA_EXPECT_SUCCESS \
- EXPECT_EQ(work_element_count, std::accumulate(outbuf, outbuf + bufsize, 0))
+// test valid inputs
+#define TEST_LAUNCH_PARAMETER(work_element_count) \
+ cfg = GetCudaLaunchConfig(bufsize, d); \
+ SetOutbufZero<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, outbuf); \
+ CUDA_ASSERT_SUCCESS \
+ cfg = GetCudaLaunchConfig(work_element_count, d); \
+ Count1D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, bufsize, outbuf); \
+ CUDA_EXPECT_SUCCESS \
+ EXPECT_EQ(work_element_count, std::accumulate(outbuf, outbuf + bufsize, 0)); \
+ \
+ cfg = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
+ SetOutbufZero<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, outbuf); \
+ CUDA_ASSERT_SUCCESS \
+ cfg = GetCudaLaunchConfig(work_element_count, d, Count1D, 0, 0); \
+ Count1D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, bufsize, outbuf); \
+ CUDA_EXPECT_SUCCESS \
+ EXPECT_EQ(work_element_count, std::accumulate(outbuf, outbuf + bufsize, 0))
TEST_LAUNCH_PARAMETER(128);
TEST_LAUNCH_PARAMETER(129);
@@ -181,7 +181,7 @@ TEST_F(CudaLaunchConfigTest, GetCudaLaunchConfig) {
TEST_LAUNCH_PARAMETER(8192);
TEST_LAUNCH_PARAMETER(123456);
TEST_LAUNCH_PARAMETER(1 << 30);
- #undef TEST_LAUNCH_PARAMETER
+#undef TEST_LAUNCH_PARAMETER
}
bool operator==(const Cuda2DLaunchConfig& a, const Cuda2DLaunchConfig& b) {
@@ -200,27 +200,27 @@ TEST_F(CudaLaunchConfigTest, GetCuda2DLaunchConfig) {
Cuda2DLaunchConfig cfg;
CudaLaunchConfig cfg1d;
- // test valid inputs
- #define TEST_LAUNCH_PARAMETER(dimx, dimy) \
- cfg1d = GetCudaLaunchConfig(bufsize, d); \
- SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>> \
- (cfg1d, outbuf);\
- CUDA_ASSERT_SUCCESS \
- cfg = GetCuda2DLaunchConfig(dimx, dimy, d); \
- Count2D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> ( \
- cfg, bufsize, outbuf); \
- CUDA_EXPECT_SUCCESS \
- EXPECT_EQ(dimx * dimy, std::accumulate(outbuf, outbuf + bufsize, 0)); \
- \
- cfg1d = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
- SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>> \
- (cfg1d, outbuf);\
- CUDA_ASSERT_SUCCESS \
- cfg = GetCuda2DLaunchConfig(dimx, dimy, d, Count2D, 0, 0); \
- Count2D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> ( \
- cfg, bufsize, outbuf); \
- CUDA_EXPECT_SUCCESS \
- EXPECT_EQ(dimx * dimy, std::accumulate(outbuf, outbuf + bufsize, 0))
+// test valid inputs
+#define TEST_LAUNCH_PARAMETER(dimx, dimy) \
+ cfg1d = GetCudaLaunchConfig(bufsize, d); \
+ SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>>( \
+ cfg1d, outbuf); \
+ CUDA_ASSERT_SUCCESS \
+ cfg = GetCuda2DLaunchConfig(dimx, dimy, d); \
+ Count2D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, bufsize, outbuf); \
+ CUDA_EXPECT_SUCCESS \
+ EXPECT_EQ(dimx* dimy, std::accumulate(outbuf, outbuf + bufsize, 0)); \
+ \
+ cfg1d = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
+ SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>>( \
+ cfg1d, outbuf); \
+ CUDA_ASSERT_SUCCESS \
+ cfg = GetCuda2DLaunchConfig(dimx, dimy, d, Count2D, 0, 0); \
+ Count2D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, bufsize, outbuf); \
+ CUDA_EXPECT_SUCCESS \
+ EXPECT_EQ(dimx* dimy, std::accumulate(outbuf, outbuf + bufsize, 0))
TEST_LAUNCH_PARAMETER(128, 128);
TEST_LAUNCH_PARAMETER(129, 64);
@@ -233,24 +233,24 @@ TEST_F(CudaLaunchConfigTest, GetCuda2DLaunchConfig) {
TEST_LAUNCH_PARAMETER(123456, 12);
TEST_LAUNCH_PARAMETER(1, 1 << 30);
TEST_LAUNCH_PARAMETER(1 << 30, 1);
- #undef TEST_LAUNCH_PARAMETER
+#undef TEST_LAUNCH_PARAMETER
}
TEST_F(CudaLaunchConfigTest, GetCuda3DLaunchConfig) {
Cuda3DLaunchConfig cfg;
CudaLaunchConfig cfg1d;
- // test valid inputs
- #define TEST_LAUNCH_PARAMETER(dimx, dimy, dimz) \
- cfg1d = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
- SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>> \
- (cfg1d, outbuf);\
- CUDA_ASSERT_SUCCESS \
- cfg = GetCuda3DLaunchConfig(dimx, dimy, dimz, d, Count3D, 0, 0); \
- Count3D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>> ( \
- cfg, bufsize, outbuf); \
- CUDA_EXPECT_SUCCESS \
- EXPECT_EQ(dimx * dimy * dimz, std::accumulate(outbuf, outbuf + bufsize, 0))
+// test valid inputs
+#define TEST_LAUNCH_PARAMETER(dimx, dimy, dimz) \
+ cfg1d = GetCudaLaunchConfig(bufsize, d, SetOutbufZero, 0, 0); \
+ SetOutbufZero<<<cfg1d.block_count, cfg1d.thread_per_block, 0, d.stream()>>>( \
+ cfg1d, outbuf); \
+ CUDA_ASSERT_SUCCESS \
+ cfg = GetCuda3DLaunchConfig(dimx, dimy, dimz, d, Count3D, 0, 0); \
+ Count3D<<<cfg.block_count, cfg.thread_per_block, 0, d.stream()>>>( \
+ cfg, bufsize, outbuf); \
+ CUDA_EXPECT_SUCCESS \
+ EXPECT_EQ(dimx* dimy* dimz, std::accumulate(outbuf, outbuf + bufsize, 0))
TEST_LAUNCH_PARAMETER(128, 128, 128);
TEST_LAUNCH_PARAMETER(129, 64, 1024);
@@ -264,7 +264,7 @@ TEST_F(CudaLaunchConfigTest, GetCuda3DLaunchConfig) {
TEST_LAUNCH_PARAMETER(1, 1, 1 << 30);
TEST_LAUNCH_PARAMETER(1, 1 << 30, 1);
TEST_LAUNCH_PARAMETER(1 << 30, 1, 1);
- #undef TEST_LAUNCH_PARAMETER
+#undef TEST_LAUNCH_PARAMETER
}
TEST(CudaDeviceFunctionsTest, ShuffleGetSrcLane) {