summaryrefslogtreecommitdiff
path: root/utests/compiler_uint3_unaligned_copy.cpp
blob: d42b4c3878e2a97452d0450b3ea4202b35515b6a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#include "utest_helper.hpp"

static void compiler_uint3_unaligned_copy(void)
{
  const size_t n = 128;

  // Setup kernel and buffers. Note that uint3 is aligned on 16 bytes
  // according to the OCL specification
  OCL_CREATE_KERNEL("compiler_uint3_unaligned_copy");
  buf_data[0] = (uint32_t*) malloc(sizeof(uint32_t[4]) * n);
  for (uint32_t i = 0; i < n; ++i) {
    ((uint32_t*)buf_data[0])[3*i+0] = 3*i+0;
    ((uint32_t*)buf_data[0])[3*i+1] = 3*i+1;
    ((uint32_t*)buf_data[0])[3*i+2] = 3*i+2;
  }

  OCL_CREATE_BUFFER(buf[0], CL_MEM_COPY_HOST_PTR, n * sizeof(uint32_t[4]), buf_data[0]);
  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(uint32_t[4]), NULL);
  free(buf_data[0]);
  buf_data[0] = NULL;

  // Run the kernel
  OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
  globals[0] = n;
  locals[0] = 16;
  OCL_NDRANGE(1);

  // Check result
  OCL_MAP_BUFFER(0);
  OCL_MAP_BUFFER(1);
  for (uint32_t i = 0; i < n; ++i) {
    OCL_ASSERT(((uint32_t*)buf_data[0])[3*i+0] == ((uint32_t*)buf_data[1])[3*i+0]);
    OCL_ASSERT(((uint32_t*)buf_data[0])[3*i+1] == ((uint32_t*)buf_data[1])[3*i+1]);
    OCL_ASSERT(((uint32_t*)buf_data[0])[3*i+2] == ((uint32_t*)buf_data[1])[3*i+2]);
  }
}

MAKE_UTEST_FROM_FUNCTION(compiler_uint3_unaligned_copy);