74 std::vector<DenseIndex> dims;
75 dims.push_back(sizeDim0);
76 dims.push_back(sizeDim1);
77 dims.push_back(sizeDim2);
78 dims.push_back(sizeDim3);
81 for (
DenseIndex d = 0; d < 3; ++d) out_shape[d] = (d < dim) ? dims[d] : dims[d + 1];
96 tensor(ix) =
static_cast<DataType
>((ix[dim] != 0) ? -1.0 : 10.0);
102 std::size_t in_bytes = tensor.size() *
sizeof(DataType);
103 std::size_t out_bytes = tensor_arg.size() *
sizeof(
DenseIndex);
105 DataType* d_in =
static_cast<DataType*
>(sycl_device.allocate(in_bytes));
112 sycl_device.memcpyHostToDevice(d_in, tensor.data(), in_bytes);
113 gpu_out.device(sycl_device) = gpu_in.argmax(dim);
114 sycl_device.memcpyDeviceToHost(tensor_arg.data(), d_out, out_bytes);
117 size_t(sizeDim0 * sizeDim1 * sizeDim2 * sizeDim3 / tensor.dimension(dim)));
124 sycl_device.synchronize();
135 tensor(ix) =
static_cast<DataType
>((ix[dim] != tensor.dimension(dim) - 1) ? -1.0 : 20.0);
141 sycl_device.memcpyHostToDevice(d_in, tensor.data(), in_bytes);
142 gpu_out.device(sycl_device) = gpu_in.argmax(dim);
143 sycl_device.memcpyDeviceToHost(tensor_arg.data(), d_out, out_bytes);
149 sycl_device.deallocate(d_in);
150 sycl_device.deallocate(d_out);
int i
Definition: BiCGSTAB_step_by_step.cpp:9
const unsigned n
Definition: CG3DPackingUnitTest.cpp:11
A tensor expression mapping an existing array of data.
Definition: TensorMap.h:33
The tensor class.
Definition: Tensor.h:68
char char char int int * k
Definition: level2_impl.h:374
#define VERIFY_IS_EQUAL(a, b)
Definition: main.h:367
std::array< T, N > array
Definition: EmulateArray.h:231
EIGEN_DEFAULT_DENSE_INDEX_TYPE DenseIndex
Definition: Meta.h:75
std::ptrdiff_t j
Definition: tut_arithmetic_redux_minmax.cpp:2