diff options
author | A. Unique TensorFlower <nobody@tensorflow.org> | 2016-04-18 08:05:42 -0800 |
---|---|---|
committer | TensorFlower Gardener <gardener@tensorflow.org> | 2016-04-18 09:12:23 -0700 |
commit | 517d3af445d85e2f6945fcdfc4fed4e46b1e0e35 (patch) | |
tree | 0a38b31e0aabf941effedfa2652298362ce9b28c /tensorflow/core/kernels/nn_ops_test.cc | |
parent | 3f27cffdae7cf9b1404d664b28be42b933908b0a (diff) |
Parallelize MaxPool across batch dimension.
Benchmark Base (ns) New (ns) Improvement
------------------------------------------------------------------
BM_MaxPool_32_112_112_64_3_3_2_VALID_1 28173747 28956041 -2.8%
BM_MaxPool_32_56_56_192_3_3_2_VALID_1 14467716 14581478 -0.8%
BM_MaxPool_32_28_28_352_3_3_2_VALID_1 5318842 5367336 -0.9%
BM_MaxPool_32_14_14_576_3_3_2_VALID_1 1331917 1351642 -1.5%
BM_MaxPool_32_112_112_64_3_3_2_SAME_1 28757024 29005280 -0.9%
BM_MaxPool_32_56_56_192_3_3_2_SAME_1 15119295 15478783 -2.4%
BM_MaxPool_32_28_28_352_3_3_2_SAME_1 5802450 5871220 -1.2%
BM_MaxPool_32_14_14_576_3_3_2_SAME_1 1632582 1662128 -1.8%
BM_MaxPool_32_112_112_64_3_3_2_VALID_4 28579650 8240771 +71.2%
BM_MaxPool_32_56_56_192_3_3_2_VALID_4 14621344 4373595 +70.1%
BM_MaxPool_32_28_28_352_3_3_2_VALID_4 5404303 1571711 +70.9%
BM_MaxPool_32_14_14_576_3_3_2_VALID_4 1343607 427873 +68.2%
BM_MaxPool_32_112_112_64_3_3_2_SAME_4 29195151 8204002 +71.9%
BM_MaxPool_32_56_56_192_3_3_2_SAME_4 15314088 4642979 +69.7%
BM_MaxPool_32_28_28_352_3_3_2_SAME_4 6094918 1777112 +70.8%
BM_MaxPool_32_14_14_576_3_3_2_SAME_4 1643584 544554 +66.9%
TESTED:
- passed opensource_build
- passed unit tests
Change: 120128184
Diffstat (limited to 'tensorflow/core/kernels/nn_ops_test.cc')
-rw-r--r-- | tensorflow/core/kernels/nn_ops_test.cc | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/tensorflow/core/kernels/nn_ops_test.cc b/tensorflow/core/kernels/nn_ops_test.cc
index bfedbc40fe..52b6b2e1f6 100644
--- a/tensorflow/core/kernels/nn_ops_test.cc
+++ b/tensorflow/core/kernels/nn_ops_test.cc
@@ -908,10 +908,10 @@ MaxPooling Op
 static void BM_MaxPool(int iters, int batch_size, int rows, int cols, int depth,
                        int kernel_rows, int kernel_cols, int stride,
                        Padding padding, int num_threads, const string& label) {
-  testing::UseRealTime();  // TODO XXX
   tensorflow::testing::StopTiming();
   SessionOptions options;
   options.config.set_intra_op_parallelism_threads(num_threads);
+
   std::unique_ptr<Device> device(
       DeviceFactory::NewDevice("CPU", options, "/job:a/replica:0/task:0"));
```