diff options
Diffstat (limited to 'tensorflow/core/kernels/sparse_xent_op_test.cc')
-rw-r--r-- | tensorflow/core/kernels/sparse_xent_op_test.cc | 78 |
1 files changed, 78 insertions, 0 deletions
diff --git a/tensorflow/core/kernels/sparse_xent_op_test.cc b/tensorflow/core/kernels/sparse_xent_op_test.cc new file mode 100644 index 0000000000..16335a9f1b --- /dev/null +++ b/tensorflow/core/kernels/sparse_xent_op_test.cc @@ -0,0 +1,78 @@ +/* Copyright 2015 Google Inc. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +==============================================================================*/ + +#include <random> + +#include "tensorflow/core/common_runtime/kernel_benchmark_testlib.h" +#include "tensorflow/core/kernels/xent_op.h" +#include "tensorflow/core/platform/test.h" +#include "tensorflow/core/platform/test_benchmark.h" +#include "tensorflow/core/public/tensor.h" + +namespace tensorflow { + +static Graph* SparseXent(int batch_size, int num_classes) { + Graph* g = new Graph(OpRegistry::Global()); + Tensor logits(DT_FLOAT, TensorShape({batch_size, num_classes})); + logits.flat<float>().setRandom(); + Tensor labels(DT_INT64, TensorShape({batch_size})); + std::random_device rd; + std::mt19937 gen(rd()); + std::uniform_int_distribution<> dist(0, num_classes - 1); + auto labels_t = labels.flat<int64>(); + for (int i = 0; i < batch_size; ++i) { + labels_t(i) = dist(gen); + } + test::graph::Binary(g, "SparseSoftmaxCrossEntropyWithLogits", + test::graph::Constant(g, logits), + test::graph::Constant(g, labels)); + return g; +} + +#define BM_SparseXentDev(BATCH, CLASS, DEVICE) \ + static void BM_SparseXent##_##BATCH##_##CLASS##_##DEVICE(int iters) { \ + testing::ItemsProcessed(static_cast<int64>(iters) * BATCH * CLASS); \ + test::Benchmark(#DEVICE, SparseXent(BATCH, CLASS)).Run(iters); \ + } \ + BENCHMARK(BM_SparseXent##_##BATCH##_##CLASS##_##DEVICE); + +/// The representative tests for ptb_word on GPU +BM_SparseXentDev(8, 1000000, gpu); + +BM_SparseXentDev(16, 10000, gpu); +BM_SparseXentDev(16, 30000, gpu); +BM_SparseXentDev(16, 100000, gpu); + +BM_SparseXentDev(32, 10000, gpu); +BM_SparseXentDev(32, 30000, gpu); +BM_SparseXentDev(32, 100000, gpu); + +BM_SparseXentDev(64, 10000, gpu); +BM_SparseXentDev(64, 30000, gpu); +BM_SparseXentDev(64, 100000, gpu); + +// CPU +BM_SparseXentDev(8, 1000000, cpu); + +BM_SparseXentDev(16, 10000, cpu); +BM_SparseXentDev(16, 100000, cpu); + +BM_SparseXentDev(32, 10000, cpu); +BM_SparseXentDev(32, 100000, cpu); + +BM_SparseXentDev(64, 10000, cpu); +BM_SparseXentDev(64, 100000, cpu); + +} // end namespace tensorflow |