From 2e704d4257f235dd1f3224cd590e4fca4e3aaf96 Mon Sep 17 00:00:00 2001 From: Mehdi Goli Date: Thu, 10 Nov 2016 18:45:12 +0000 Subject: Adding Memset; optimising MecopyDeviceToHost by removing double copying; --- unsupported/test/cxx11_tensor_device_sycl.cpp | 13 +++++++++++++ 1 file changed, 13 insertions(+) (limited to 'unsupported/test/cxx11_tensor_device_sycl.cpp') diff --git a/unsupported/test/cxx11_tensor_device_sycl.cpp b/unsupported/test/cxx11_tensor_device_sycl.cpp index 7f79753c5..820bc88d0 100644 --- a/unsupported/test/cxx11_tensor_device_sycl.cpp +++ b/unsupported/test/cxx11_tensor_device_sycl.cpp @@ -19,10 +19,23 @@ #include "main.h" #include +#include void test_device_sycl(const Eigen::SyclDevice &sycl_device) { std::cout <<"Helo from ComputeCpp: the requested device exists and the device name is : " << sycl_device.m_queue.get_device(). template get_info() < tensorRange = {{sizeDim1}}; + Tensor in(tensorRange); + Tensor in1(tensorRange); + memset(in1.data(), 1,in1.dimensions().TotalSize()*sizeof(int)); + int * gpu_in_data = static_cast(sycl_device.allocate(in.dimensions().TotalSize()*sizeof(int))); + sycl_device.memset(gpu_in_data, 1,in.dimensions().TotalSize()*sizeof(int) ); + sycl_device.memcpyDeviceToHost(in.data(), gpu_in_data, in.dimensions().TotalSize()*sizeof(int) ); + for (int i=0; i