diff options
Diffstat (limited to 'utests/compiler_get_max_sub_group_size.cpp')
-rw-r--r-- | utests/compiler_get_max_sub_group_size.cpp | 32 |
1 files changed, 32 insertions, 0 deletions
diff --git a/utests/compiler_get_max_sub_group_size.cpp b/utests/compiler_get_max_sub_group_size.cpp new file mode 100644 index 00000000..debdf940 --- /dev/null +++ b/utests/compiler_get_max_sub_group_size.cpp @@ -0,0 +1,32 @@ +#include "utest_helper.hpp" + +void compiler_get_max_sub_group_size(void) +{ + const size_t n = 256; + + // Setup kernel and buffers + OCL_CREATE_KERNEL("compiler_get_max_sub_group_size"); + OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(int), NULL); + OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); + + globals[0] = n; + locals[0] = 16; + + OCL_MAP_BUFFER(0); + for (int32_t i = 0; i < (int32_t) n; ++i) + ((int*)buf_data[0])[i] = -1; + OCL_UNMAP_BUFFER(0); + + // Run the kernel on GPU + OCL_NDRANGE(1); + + // Compare + OCL_MAP_BUFFER(0); + int* dst = (int *)buf_data[0]; + for (int32_t i = 0; i < (int32_t) n; ++i){ + OCL_ASSERT(8 == dst[i] || 16 == dst[i]); + } + OCL_UNMAP_BUFFER(0); +} + +MAKE_UTEST_FROM_FUNCTION(compiler_get_max_sub_group_size); |