diff options
author | Grigori Goronzy <[email protected]> | 2015-05-28 13:01:51 +0200 |
---|---|---|
committer | Grigori Goronzy <[email protected]> | 2015-06-29 13:24:37 +0200 |
commit | d15b32ebded278243eb648bb9ecd4c5f5d6d0569 (patch) | |
tree | 5f9f347641e1a5751f5a463a723d67a8d450d7a3 /src/gallium/state_trackers/clover | |
parent | 249a9df7fce0a6bebc70852ab583c5324208bf06 (diff) |
clover: implement CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE
Work-group size should always be aligned to subgroup size; this is a
basic requirement, otherwise some work-items will be no-operation.
It might make sense to refine the value according to a kernel's
resource usage, but that's a possible optimization for the future.
Reviewed-by: Francisco Jerez <[email protected]>
Diffstat (limited to 'src/gallium/state_trackers/clover')
-rw-r--r-- | src/gallium/state_trackers/clover/api/kernel.cpp | 2 | ||||
-rw-r--r-- | src/gallium/state_trackers/clover/core/device.cpp | 5 | ||||
-rw-r--r-- | src/gallium/state_trackers/clover/core/device.hpp | 1 |
3 files changed, 7 insertions, 1 deletions
diff --git a/src/gallium/state_trackers/clover/api/kernel.cpp b/src/gallium/state_trackers/clover/api/kernel.cpp index 05cc392a914..857a152b554 100644 --- a/src/gallium/state_trackers/clover/api/kernel.cpp +++ b/src/gallium/state_trackers/clover/api/kernel.cpp @@ -169,7 +169,7 @@ clGetKernelWorkGroupInfo(cl_kernel d_kern, cl_device_id d_dev, break; case CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE: - buf.as_scalar<size_t>() = 1; + buf.as_scalar<size_t>() = dev.subgroup_size(); break; case CL_KERNEL_PRIVATE_MEM_SIZE: diff --git a/src/gallium/state_trackers/clover/core/device.cpp b/src/gallium/state_trackers/clover/core/device.cpp index 42b45b7f2b8..c42d1d26004 100644 --- a/src/gallium/state_trackers/clover/core/device.cpp +++ b/src/gallium/state_trackers/clover/core/device.cpp @@ -185,6 +185,11 @@ device::max_block_size() const { return { v.begin(), v.end() }; } +cl_uint +device::subgroup_size() const { + return get_compute_param<uint32_t>(pipe, PIPE_COMPUTE_CAP_SUBGROUP_SIZE)[0]; +} + std::string device::device_name() const { return pipe->get_name(pipe); diff --git a/src/gallium/state_trackers/clover/core/device.hpp b/src/gallium/state_trackers/clover/core/device.hpp index de5fc6bb9c4..285784744f3 100644 --- a/src/gallium/state_trackers/clover/core/device.hpp +++ b/src/gallium/state_trackers/clover/core/device.hpp @@ -67,6 +67,7 @@ namespace clover { bool has_doubles() const; std::vector<size_t> max_block_size() const; + cl_uint subgroup_size() const; std::string device_name() const; std::string vendor_name() const; enum pipe_shader_ir ir_format() const; |