summaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
authorPan Xiuli <xiuli.pan@intel.com>2016-05-12 09:09:50 +0800
committerYang Rong <rong.r.yang@intel.com>2016-06-13 17:02:09 +0800
commitaa3ee67c825fbef5f68b31345c060c981bf35ad3 (patch)
treeef90a2bf68fc6545e0e82611b2b1ffe923d1a3a8 /src
parentda7eff067fd81fcb99025b2548d18fcb79beee7b (diff)
downloadbeignet-aa3ee67c825fbef5f68b31345c060c981bf35ad3.tar.gz
Runtime: Add API clGetKernelSubGroupInfoKHR for subgroup extension
Signed-off-by: Pan Xiuli <xiuli.pan@intel.com> Reviewed-by: Yang Rong <rong.r.yang@intel.com>
Diffstat (limited to 'src')
-rw-r--r--src/cl_api.c20
-rw-r--r--src/cl_device_id.c83
-rw-r--r--src/cl_device_id.h9
3 files changed, 112 insertions, 0 deletions
diff --git a/src/cl_api.c b/src/cl_api.c
index 881ea6dc..85ed4cff 100644
--- a/src/cl_api.c
+++ b/src/cl_api.c
@@ -1348,6 +1348,26 @@ clGetKernelWorkGroupInfo(cl_kernel kernel,
}
cl_int
+clGetKernelSubGroupInfoKHR(cl_kernel kernel,
+ cl_device_id device,
+ cl_kernel_work_group_info param_name,
+ size_t input_value_size,
+ const void * input_value,
+ size_t param_value_size,
+ void * param_value,
+ size_t * param_value_size_ret)
+{
+ return cl_get_kernel_subgroup_info(kernel,
+ device,
+ param_name,
+ input_value_size,
+ input_value,
+ param_value_size,
+ param_value,
+ param_value_size_ret);
+}
+
+cl_int
clWaitForEvents(cl_uint num_events,
const cl_event * event_list)
{
diff --git a/src/cl_device_id.c b/src/cl_device_id.c
index 00d014bb..66666ea7 100644
--- a/src/cl_device_id.c
+++ b/src/cl_device_id.c
@@ -27,6 +27,7 @@
#include "cl_thread.h"
#include "CL/cl.h"
#include "CL/cl_ext.h"
+#include "CL/cl_intel.h"
#include "cl_gbe_loader.h"
#include "cl_alloc.h"
@@ -1088,3 +1089,85 @@ error:
return err;
}
+LOCAL cl_int
+cl_get_kernel_subgroup_info(cl_kernel kernel,
+ cl_device_id device,
+ cl_kernel_work_group_info param_name,
+ size_t input_value_size,
+ const void* input_value,
+ size_t param_value_size,
+ void* param_value,
+ size_t* param_value_size_ret)
+{
+ int err = CL_SUCCESS;
+ if(device != NULL)
+ if (kernel->program->ctx->device != device)
+ return CL_INVALID_DEVICE;
+
+ CHECK_KERNEL(kernel);
+ switch (param_name) {
+ case CL_KERNEL_MAX_SUB_GROUP_SIZE_FOR_NDRANGE_KHR:
+ {
+ int i, dim = 0;
+ size_t local_sz = 1;
+ if (param_value && param_value_size < sizeof(size_t))
+ return CL_INVALID_VALUE;
+ if (param_value_size_ret != NULL)
+ *param_value_size_ret = sizeof(size_t);
+ switch (input_value_size)
+ {
+ case sizeof(size_t)*1:
+ case sizeof(size_t)*2:
+ case sizeof(size_t)*3:
+ dim = input_value_size/sizeof(size_t);
+ break;
+ default: return CL_INVALID_VALUE;
+ }
+ if (input_value == NULL )
+ return CL_INVALID_VALUE;
+ for(i = 0; i < dim; i++)
+ local_sz *= ((size_t*)input_value)[i];
+ if (param_value) {
+ size_t simd_sz = cl_kernel_get_simd_width(kernel);
+ size_t sub_group_size = local_sz >= simd_sz? simd_sz : local_sz;
+ *(size_t*)param_value = sub_group_size;
+ return CL_SUCCESS;
+ }
+ break;
+ }
+ case CL_KERNEL_SUB_GROUP_COUNT_FOR_NDRANGE_KHR:
+ {
+ int i, dim = 0;
+ size_t local_sz = 1;
+ if (param_value && param_value_size < sizeof(size_t))
+ return CL_INVALID_VALUE;
+ if (param_value_size_ret != NULL)
+ *param_value_size_ret = sizeof(size_t);
+ switch (input_value_size)
+ {
+ case sizeof(size_t)*1:
+ case sizeof(size_t)*2:
+ case sizeof(size_t)*3:
+ dim = input_value_size/sizeof(size_t);
+ break;
+ default: return CL_INVALID_VALUE;
+ }
+ if (input_value == NULL )
+ return CL_INVALID_VALUE;
+ for(i = 0; i < dim; i++)
+ local_sz *= ((size_t*)input_value)[i];
+ if (param_value) {
+ size_t simd_sz = cl_kernel_get_simd_width(kernel);
+ size_t sub_group_num = (local_sz + simd_sz - 1) / simd_sz;
+ *(size_t*)param_value = sub_group_num;
+ return CL_SUCCESS;
+ }
+ break;
+ }
+ default:
+ return CL_INVALID_VALUE;
+ };
+
+error:
+ return err;
+}
diff --git a/src/cl_device_id.h b/src/cl_device_id.h
index b01a6fb4..7db125b6 100644
--- a/src/cl_device_id.h
+++ b/src/cl_device_id.h
@@ -149,6 +149,15 @@ extern cl_int cl_get_kernel_workgroup_info(cl_kernel kernel,
size_t param_value_size,
void * param_value,
size_t * param_value_size_ret);
+
+extern cl_int cl_get_kernel_subgroup_info(cl_kernel kernel,
+ cl_device_id device,
+ cl_kernel_work_group_info param_name,
+ size_t input_value_size,
+ const void * input_value,
+ size_t param_value_size,
+ void * param_value,
+ size_t * param_value_size_ret);
/* Returns the Gen device ID */
extern cl_int cl_device_get_version(cl_device_id device, cl_int *ver);
extern size_t cl_get_kernel_max_wg_sz(cl_kernel);