summaryrefslogtreecommitdiff
path: root/src/cl_api.c
diff options
context:
space:
mode:
author Zhigang Gong <zhigang.gong@intel.com> 2015-11-12 16:47:04 +0800
committer Yang Rong <rong.r.yang@intel.com> 2015-11-25 11:45:13 +0800
commit 06b0298cb481f936f84e9e9af8fae0763574d3fd (patch)
tree 31f2ec7fbca0d3be53d019cd690f4f30ab68b2f2 /src/cl_api.c
parent 5d5aa6085ea0724ecea7471f4b710d8f21e206bc (diff)
download beignet-06b0298cb481f936f84e9e9af8fae0763574d3fd.tar.gz
runtime: set CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE to kernel's SIMD_WIDTH.
It makes sense to set CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE to the kernel's SIMD width. This gives Intel OpenCL applications a way to query the SIMD width at runtime and makes some SIMD-width-dependent optimizations possible. Signed-off-by: Zhigang Gong <zhigang.gong@intel.com> Reviewed-by: Ruiling Song <ruiling.song@intel.com>
Diffstat (limited to 'src/cl_api.c')
-rw-r--r-- src/cl_api.c 3
1 files changed, 2 insertions, 1 deletions
diff --git a/src/cl_api.c b/src/cl_api.c
index ddd39cfc..d8ccd7e4 100644
--- a/src/cl_api.c
+++ b/src/cl_api.c
@@ -3022,6 +3022,7 @@ clEnqueueNDRangeKernel(cl_command_queue command_queue,
err = cl_command_queue_flush(command_queue);
}
+error:
if(b_output_kernel_perf)
{
if(kernel->program->build_opts != NULL)
@@ -3029,7 +3030,7 @@ clEnqueueNDRangeKernel(cl_command_queue command_queue,
else
time_end(command_queue->ctx, cl_kernel_get_name(kernel), "", command_queue);
}
-error:
+
return err;
}