#include "utest_helper.hpp" #include #include template static void compiler_vector_load_store(int elemNum, const char *kernelName) { const size_t n = elemNum * 256; if (strstr(kernelName, "half") != NULL) if (!cl_check_half()) return; // Setup kernel and buffers if (strstr(kernelName, "half") != NULL) OCL_CALL(cl_kernel_init, "compiler_vector_load_store.cl", kernelName, SOURCE, "-DHALF"); else OCL_CREATE_KERNEL_FROM_FILE("compiler_vector_load_store", kernelName); buf_data[0] = (T*) malloc(sizeof(T) * n); for (uint32_t i = 0; i < n; ++i) { if (strstr(kernelName, "half") != NULL) ((T*)buf_data[0])[i] = __float_to_half(as_uint((float)i/(float)n)); else ((T*)buf_data[0])[i] = i; } OCL_CREATE_BUFFER(buf[0], CL_MEM_COPY_HOST_PTR, n * sizeof(T), buf_data[0]); OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(T), NULL); free(buf_data[0]); buf_data[0] = NULL; // Run the kernel OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]); OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]); globals[0] = n / elemNum; locals[0] = 16; OCL_NDRANGE(1); // Check result OCL_MAP_BUFFER(0); OCL_MAP_BUFFER(1); for (uint32_t i = 0; i < n; ++i) { int shift = ((i % elemNum) + 1); if (strstr(kernelName, "double") != NULL) OCL_ASSERT((((T*)buf_data[1])[i] - ((T)((T*)buf_data[0])[i] + shift)) < 1e-5); else if (strstr(kernelName, "half") != NULL) { float fdst = as_float(__half_to_float(((T*)buf_data[1])[i])); float fsrc = as_float(__half_to_float((T)(((T*)buf_data[0])[i]))); fsrc += shift; //printf("%d (%f, %f)\n",i, fdst, fsrc); OCL_ASSERT((fabs(fsrc - fdst) <= 0.03 * fabs(fdst))); } else OCL_ASSERT(((T*)buf_data[1])[i] == (T)(((T*)buf_data[0])[i] + shift)); } OCL_UNMAP_BUFFER(0); OCL_UNMAP_BUFFER(1); } #define compiler_vector_load_store(type, n, kernel_type, keep_program) \ static void compiler_vector_ ##kernel_type ##n ##_load_store(void)\ {\ compiler_vector_load_store(n, "test_" #kernel_type #n);\ }\ MAKE_UTEST_FROM_FUNCTION_KEEP_PROGRAM(compiler_vector_ ## kernel_type ##n ##_load_store, keep_program); #define test_all_vector(type, kernel_type, keep_program) \ compiler_vector_load_store(type, 2, kernel_type, true) \ compiler_vector_load_store(type, 3, kernel_type, true) \ compiler_vector_load_store(type, 4, kernel_type, true) \ compiler_vector_load_store(type, 8, kernel_type, true) \ compiler_vector_load_store(type, 16, kernel_type, keep_program) test_all_vector(int8_t, char, true) test_all_vector(uint8_t, uchar, true) test_all_vector(int16_t, short, true) test_all_vector(uint16_t, ushort, true) test_all_vector(int32_t, int, true) test_all_vector(uint32_t, uint, true) test_all_vector(float, float, true) //test_all_vector(double, double, true) test_all_vector(int64_t, long, true) test_all_vector(uint64_t, ulong, false) test_all_vector(uint16_t, half, false)