90 for (
size_t i = 0;
i < out_range.size(); ++
i) out_range[
i] = in_range[
i] * broadcasts[
i];
97 for (IndexType
i = 0;
i < input.size(); ++
i) input(
i) =
static_cast<DataType
>(
i);
99 DataType* gpu_in_data =
100 static_cast<DataType*
>(sycl_device.allocate(input.dimensions().TotalSize() *
sizeof(DataType)));
101 DataType* gpu_out_data =
102 static_cast<DataType*
>(sycl_device.allocate(
out.dimensions().TotalSize() *
sizeof(DataType)));
106 sycl_device.memcpyHostToDevice(gpu_in_data, input.data(), (input.dimensions().TotalSize()) *
sizeof(DataType));
107 gpu_out.device(sycl_device) = gpu_in.broadcast(broadcasts);
108 sycl_device.memcpyDeviceToHost(
out.data(), gpu_out_data, (
out.dimensions().TotalSize()) *
sizeof(DataType));
110 for (IndexType
i = 0;
i < inDim1 * bDim1; ++
i) {
111 for (IndexType
j = 0;
j < inDim2 * bDim2; ++
j) {
112 for (IndexType
k = 0;
k < inDim3 * bDim3; ++
k) {
113 for (IndexType l = 0; l < inDim4 * bDim4; ++l) {
119 printf(
"Broadcast Test Passed\n");
120 sycl_device.deallocate(gpu_in_data);
121 sycl_device.deallocate(gpu_out_data);
int i
Definition: BiCGSTAB_step_by_step.cpp:9
A tensor expression mapping an existing array of data.
Definition: TensorMap.h:33
The tensor class.
Definition: Tensor.h:68
#define VERIFY_IS_APPROX(a, b)
Definition: integer_types.cpp:13
char char char int int * k
Definition: level2_impl.h:374
#define VERIFY_IS_EQUAL(a, b)
Definition: main.h:367
std::array< T, N > array
Definition: EmulateArray.h:231
std::ofstream out("Result.txt")
std::ptrdiff_t j
Definition: tut_arithmetic_redux_minmax.cpp:2