summaryrefslogtreecommitdiff
path: root/src/cl_command_queue_gen7.c
diff options
context:
space:
mode:
author: Ruiling Song <ruiling.song@intel.com> 2013-08-05 15:14:39 +0800
committer: Zhigang Gong <zhigang.gong@linux.intel.com> 2013-08-06 15:09:58 +0800
commit: ae356f884dbfde6b7b38f7afa25669b8e8a6865c (patch)
tree: 9f059466a64c86aa726ca6b660c3c516c83217fe /src/cl_command_queue_gen7.c
parent: e01efd4d19a91a7d6bfce5659757d00608aa90d5 (diff)
download: beignet-ae356f884dbfde6b7b38f7afa25669b8e8a6865c.tar.gz
Fix a bug in stack calculation.
1. The thread_id is located in r0.5[0-8], so we need to get the correct bits.
2. Also, we don't need so much stack size: max_compute_unit has already been treated as #EU * max_thread_per_eu.
Signed-off-by: Ruiling Song <ruiling.song@intel.com>
Reviewed-by: Xing, Homer <homer.xing@intel.com>
Reviewed-by: Zhigang Gong <zhigang.gong@linux.intel.com>
Diffstat (limited to 'src/cl_command_queue_gen7.c')
-rw-r--r-- src/cl_command_queue_gen7.c | 1
1 files changed, 0 insertions, 1 deletions
diff --git a/src/cl_command_queue_gen7.c b/src/cl_command_queue_gen7.c
index 048595cf..89332139 100644
--- a/src/cl_command_queue_gen7.c
+++ b/src/cl_command_queue_gen7.c
@@ -180,7 +180,6 @@ cl_bind_stack(cl_gpgpu gpgpu, cl_kernel ker)
assert(offset >= 0);
stack_sz *= gbe_kernel_get_simd_width(ker->opaque);
stack_sz *= device->max_compute_unit;
- stack_sz *= device->max_thread_per_unit;
cl_gpgpu_set_stack(gpgpu, offset, stack_sz, cc_llc_l3);
}