aboutsummaryrefslogtreecommitdiffhomepage
path: root/unsupported/test/cxx11_tensor_builtins_sycl.cpp
diff options
context:
space:
mode:
authorGravatar Luke Iwanski <luke@codeplay.com>2016-11-17 11:47:13 +0000
committerGravatar Luke Iwanski <luke@codeplay.com>2016-11-17 11:47:13 +0000
commitc5130dedbe67004895e515b82657c21343719a6d (patch)
treec14ab9c643a84f66b2c6f39b1d82d892870be0cb /unsupported/test/cxx11_tensor_builtins_sycl.cpp
parentb5c75351e3b094d81d0e90906a5d7222337d1f6f (diff)
Specialised basic math functions for SYCL device.
Diffstat (limited to 'unsupported/test/cxx11_tensor_builtins_sycl.cpp')
-rw-r--r--unsupported/test/cxx11_tensor_builtins_sycl.cpp83
1 files changed, 83 insertions, 0 deletions
diff --git a/unsupported/test/cxx11_tensor_builtins_sycl.cpp b/unsupported/test/cxx11_tensor_builtins_sycl.cpp
new file mode 100644
index 000000000..aed4e47e4
--- /dev/null
+++ b/unsupported/test/cxx11_tensor_builtins_sycl.cpp
@@ -0,0 +1,83 @@
+// This file is part of Eigen, a lightweight C++ template library
+// for linear algebra.
+//
+// Copyright (C) 2016
+// Mehdi Goli Codeplay Software Ltd.
+// Ralph Potter Codeplay Software Ltd.
+// Luke Iwanski Codeplay Software Ltd.
+// Contact: <eigen@codeplay.com>
+//
+// This Source Code Form is subject to the terms of the Mozilla
+// Public License v. 2.0. If a copy of the MPL was not distributed
+// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
+
+#define EIGEN_TEST_NO_LONGDOUBLE
+#define EIGEN_TEST_NO_COMPLEX
+#define EIGEN_TEST_FUNC cxx11_tensor_builtins_sycl
+#define EIGEN_DEFAULT_DENSE_INDEX_TYPE int
+#define EIGEN_USE_SYCL
+
+#include "main.h"
+#include <unsupported/Eigen/CXX11/Tensor>
+
+using Eigen::array;
+using Eigen::SyclDevice;
+using Eigen::Tensor;
+using Eigen::TensorMap;
+
+namespace std
+{
+ template<typename T> T rsqrt(T x) { return 1/std::sqrt(x); }
+ template<typename T> T square(T x) { return x*x; }
+ template<typename T> T cube(T x) { return x*x*x; }
+ template<typename T> T inverse(T x) { return 1/x; }
+}
+
+#define TEST_UNARY_BUILTINS_FOR_SCALAR(FUNC, SCALAR) \
+{ \
+ Tensor<SCALAR, 3> in1(tensorRange); \
+ Tensor<SCALAR, 3> out1(tensorRange); \
+ in1 = in1.random(); \
+ SCALAR* gpu_data1 = static_cast<SCALAR*>(sycl_device.allocate(in1.size()*sizeof(SCALAR))); \
+ TensorMap<Tensor<SCALAR, 3>> gpu1(gpu_data1, tensorRange); \
+ sycl_device.memcpyHostToDevice(gpu_data1, in1.data(),(in1.size())*sizeof(SCALAR)); \
+ gpu1.device(sycl_device) = gpu1.FUNC(); \
+ sycl_device.memcpyDeviceToHost(out1.data(), gpu_data1,(out1.size())*sizeof(SCALAR)); \
+ for (int i = 0; i < in1.size(); ++i) { \
+ VERIFY_IS_APPROX(out1(i), std::FUNC(in1(i))); \
+ } \
+ sycl_device.deallocate(gpu_data1); \
+}
+
+#define TEST_UNARY_BUILTINS(SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(abs, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(sqrt, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(rsqrt, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(square, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(cube, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(inverse, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(tanh, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(exp, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(log, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(abs, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(ceil, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(floor, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(round, SCALAR) \
+TEST_UNARY_BUILTINS_FOR_SCALAR(log1p, SCALAR)
+
+static void test_builtin_unary_sycl(const Eigen::SyclDevice &sycl_device){
+ int sizeDim1 = 100;
+ int sizeDim2 = 100;
+ int sizeDim3 = 100;
+ array<int, 3> tensorRange = {{sizeDim1, sizeDim2, sizeDim3}};
+
+ TEST_UNARY_BUILTINS(float)
+ TEST_UNARY_BUILTINS(double)
+}
+
+
+void test_cxx11_tensor_builtins_sycl() {
+ cl::sycl::gpu_selector s;
+ Eigen::SyclDevice sycl_device(s);
+ CALL_SUBTEST(test_builtin_unary_sycl(sycl_device));
+}