summaryrefslogtreecommitdiffstats
path: root/src
diff options
context:
space:
mode:
authorKristian Høgsberg Kristensen <[email protected]>2015-06-12 17:21:01 -0700
committerKristian Høgsberg Kristensen <[email protected]>2015-06-12 18:21:50 -0700
commitfa8a07748d96525b208146065b5264821a9ef338 (patch)
treec50f03f08be45341f5f32f0da521e92192d7e9ca /src
parentc103c4990c9a647891ed3ee1667c129ee3e16996 (diff)
vk: Compute CS exec mask and thread width max in pipeline
We compute the right mask and thread width max parameters as part of pipeline creation and set them accordingly at vkCmdDispatch() and vkCmdDispatchIndirect() time. These parameters depend only on the local group size and the dispatch width of the program so we can figure this out at pipeline create time.
Diffstat (limited to 'src')
-rw-r--r--src/vulkan/device.c42
-rw-r--r--src/vulkan/pipeline.c12
-rw-r--r--src/vulkan/private.h3
3 files changed, 25 insertions, 32 deletions
diff --git a/src/vulkan/device.c b/src/vulkan/device.c
index 0126b248233..e55e66fd74f 100644
--- a/src/vulkan/device.c
+++ b/src/vulkan/device.c
@@ -3390,31 +3390,20 @@ void anv_CmdDispatch(
uint32_t z)
{
struct anv_cmd_buffer *cmd_buffer = (struct anv_cmd_buffer *) cmdBuffer;
- uint32_t size = SIMD8; /* FIXME */
- uint32_t right_mask = 0; /* FIXME */
- uint32_t thread_width_max = 0; /* FIXME */
+ struct anv_pipeline *pipeline = cmd_buffer->compute_pipeline;
+ struct brw_cs_prog_data *prog_data = &pipeline->cs_prog_data;
anv_cmd_buffer_flush_compute_state(cmd_buffer);
anv_batch_emit(&cmd_buffer->batch, GEN8_GPGPU_WALKER,
-
- .InterfaceDescriptorOffset = 0,
- .IndirectDataLength = 0,
- .IndirectDataStartAddress = 0,
-
- .SIMDSize = size,
-
+ .SIMDSize = prog_data->simd_size / 16,
.ThreadDepthCounterMaximum = 0,
.ThreadHeightCounterMaximum = 0,
- .ThreadWidthCounterMaximum = thread_width_max,
-
- .ThreadGroupIDStartingX = 0,
+ .ThreadWidthCounterMaximum = pipeline->cs_thread_width_max,
.ThreadGroupIDXDimension = x,
- .ThreadGroupIDStartingY = 0,
.ThreadGroupIDYDimension = y,
- .ThreadGroupIDStartingResumeZ = 0,
.ThreadGroupIDZDimension = z,
- .RightExecutionMask = right_mask,
+ .RightExecutionMask = pipeline->cs_right_mask,
.BottomExecutionMask = 0xffffffff);
anv_batch_emit(&cmd_buffer->batch, GEN8_MEDIA_STATE_FLUSH);
@@ -3430,6 +3419,8 @@ void anv_CmdDispatchIndirect(
VkDeviceSize offset)
{
struct anv_cmd_buffer *cmd_buffer = (struct anv_cmd_buffer *) cmdBuffer;
+ struct anv_pipeline *pipeline = cmd_buffer->compute_pipeline;
+ struct brw_cs_prog_data *prog_data = &pipeline->cs_prog_data;
struct anv_buffer *buffer = (struct anv_buffer *) _buffer;
struct anv_bo *bo = buffer->bo;
uint32_t bo_offset = buffer->offset + offset;
@@ -3440,26 +3431,13 @@ void anv_CmdDispatchIndirect(
anv_batch_lrm(&cmd_buffer->batch, GPGPU_DISPATCHDIMY, bo, bo_offset + 4);
anv_batch_lrm(&cmd_buffer->batch, GPGPU_DISPATCHDIMZ, bo, bo_offset + 8);
- uint32_t size = SIMD8; /* FIXME */
- uint32_t right_mask = 0; /* FIXME */
- uint32_t thread_width_max = 0; /* FIXME */
-
- /* FIXME: We can't compute thread_width_max for indirect, looks like it
- * depends on DIMX. */
-
anv_batch_emit(&cmd_buffer->batch, GEN8_GPGPU_WALKER,
.IndirectParameterEnable = true,
- .InterfaceDescriptorOffset = 0,
- .IndirectDataLength = 0,
- .IndirectDataStartAddress = 0,
-
- .SIMDSize = size,
-
+ .SIMDSize = prog_data->simd_size / 16,
.ThreadDepthCounterMaximum = 0,
.ThreadHeightCounterMaximum = 0,
- .ThreadWidthCounterMaximum = thread_width_max,
-
- .RightExecutionMask = right_mask,
+ .ThreadWidthCounterMaximum = pipeline->cs_thread_width_max,
+ .RightExecutionMask = pipeline->cs_right_mask,
.BottomExecutionMask = 0xffffffff);
anv_batch_emit(&cmd_buffer->batch, GEN8_MEDIA_STATE_FLUSH);
diff --git a/src/vulkan/pipeline.c b/src/vulkan/pipeline.c
index cf7562ae496..aa24ad43004 100644
--- a/src/vulkan/pipeline.c
+++ b/src/vulkan/pipeline.c
@@ -770,6 +770,18 @@ VkResult anv_CreateComputePipeline(
.URBEntryAllocationSize = 2,
.CURBEAllocationSize = 0);
+ struct brw_cs_prog_data *prog_data = &pipeline->cs_prog_data;
+ uint32_t group_size = prog_data->local_size[0] *
+ prog_data->local_size[1] * prog_data->local_size[2];
+ pipeline->cs_thread_width_max = DIV_ROUND_UP(group_size, prog_data->simd_size);
+ uint32_t remainder = group_size & (prog_data->simd_size - 1);
+
+ if (remainder > 0)
+ pipeline->cs_right_mask = ~0u >> (32 - remainder);
+ else
+ pipeline->cs_right_mask = ~0u >> (32 - prog_data->simd_size);
+
+
*pPipeline = (VkPipeline) pipeline;
return VK_SUCCESS;
diff --git a/src/vulkan/private.h b/src/vulkan/private.h
index cf1cf4c1268..08dea1526e8 100644
--- a/src/vulkan/private.h
+++ b/src/vulkan/private.h
@@ -726,6 +726,9 @@ struct anv_pipeline {
uint32_t state_sf[GEN8_3DSTATE_SF_length];
uint32_t state_raster[GEN8_3DSTATE_RASTER_length];
uint32_t state_wm_depth_stencil[GEN8_3DSTATE_WM_DEPTH_STENCIL_length];
+
+ uint32_t cs_thread_width_max;
+ uint32_t cs_right_mask;
};
struct anv_pipeline_create_info {