Skip to content

Commit

Permalink
[SYCL][CUDA][LIT] Fix base address get and subbuffer LIT test
Browse files Browse the repository at this point in the history
This commit fixes a hardcoded value for base address alignment
in the cuda backend. Also a hardcoded value that should be
dependant on the base address alignment is fixed in the subbuffer
LIT test, which now passes on CUDA.

Signed-off-by: Przemek Malon <[email protected]>
  • Loading branch information
przemektmalon committed Jun 17, 2020
1 parent 358ec04 commit 788ac4e
Show file tree
Hide file tree
Showing 2 changed files with 12 additions and 12 deletions.
15 changes: 9 additions & 6 deletions sycl/plugins/cuda/pi_cuda.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -951,12 +951,15 @@ pi_result cuda_piDeviceGetInfo(pi_device device, pi_device_info param_name,
size_t{4000u});
}
case PI_DEVICE_INFO_MEM_BASE_ADDR_ALIGN: {
// TODO: is this config consistent across all NVIDIA GPUs?
// "The minimum value is the size (in bits) of the largest OpenCL built-in
// data type supported by the device"
// Hard coded to value returned by clinfo for OpenCL 1.2 CUDA | GeForce GTX
// 1060 3GB
return getInfo(param_value_size, param_value, param_value_size_ret, 4096u);
int mem_base_addr_align = 0;
cl::sycl::detail::pi::assertion(
cuDeviceGetAttribute(&mem_base_addr_align,
CU_DEVICE_ATTRIBUTE_TEXTURE_ALIGNMENT,
device->get()) == CUDA_SUCCESS);
// Multiply by 8 as clGetDeviceInfo returns this value in bits
mem_base_addr_align *= 8;
return getInfo(param_value_size, param_value, param_value_size_ret,
mem_base_addr_align);
}
case PI_DEVICE_INFO_HALF_FP_CONFIG: {
// TODO: is this config consistent across all NVIDIA GPUs?
Expand Down
9 changes: 3 additions & 6 deletions sycl/test/basic_tests/buffer/subbuffer.cpp
Original file line number Diff line number Diff line change
@@ -1,6 +1,3 @@
// XFAIL: cuda
// TODO: Fix CUDA implementation.
//
// RUN: %clangxx -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
// RUN: env SYCL_DEVICE_TYPE=HOST %t.out
// RUN: %CPU_RUN_PLACEHOLDER %t.out
Expand Down Expand Up @@ -112,12 +109,12 @@ void check1DSubBuffer(cl::sycl::queue &q) {
assert(false && "Exception was caught");
}

for (int i = offset; i < subbuf_size; ++i)
assert(vec[i] == (i > 34 ? i * 10 : i * -10) &&
for (int i = offset; i < offset + subbuf_size; ++i)
assert(vec[i] == (i < offset + offset_inside_subbuf ? i * 10 : i * -10) &&
"Invalid result in 1d sub buffer");

for (int i = 0; i < subbuf_size; ++i)
assert(vec2[i] == (i < 3 ? (32 + i) : (32 + i) * -1) &&
assert(vec2[i] == (i < 3 ? (offset + i) : (offset + i) * -1) &&
"Invalid result in 1d sub buffer");
}

Expand Down

0 comments on commit 788ac4e

Please sign in to comment.