summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorSamuel Pitoiset <[email protected]>2017-12-14 13:51:47 +0100
committerSamuel Pitoiset <[email protected]>2017-12-14 22:23:28 +0100
commit88522e2bcd0e65ca619204f0eec96864323b94cb (patch)
treedcd0fcf97122301e42c0ca0ff08e251e72fd1f1b
parent45872a0a6d99d3f7704d9539f215eb0004c1e576 (diff)
radv: export SampleMask from pixel shaders at full rate
Use 16_ABGR instead of 32_ABGR if Z isn't written. Ported from RadeonSI. No CTS regressions on Polaris. Signed-off-by: Samuel Pitoiset <[email protected]> Reviewed-by: Bas Nieuwenhuizen <[email protected]>
-rw-r--r--src/amd/common/ac_nir_to_llvm.c46
-rw-r--r--src/amd/vulkan/radv_pipeline.c11
2 files changed, 41 insertions, 16 deletions
diff --git a/src/amd/common/ac_nir_to_llvm.c b/src/amd/common/ac_nir_to_llvm.c
index 2fe346b012e..63803f14644 100644
--- a/src/amd/common/ac_nir_to_llvm.c
+++ b/src/amd/common/ac_nir_to_llvm.c
@@ -32,6 +32,7 @@
#include <llvm-c/Transforms/Scalar.h>
#include "ac_shader_abi.h"
#include "ac_shader_info.h"
+#include "ac_shader_util.h"
#include "ac_exp_param.h"
enum radeon_llvm_calling_convention {
@@ -6211,19 +6212,42 @@ si_export_mrt_z(struct nir_to_llvm_context *ctx,
args.out[2] = LLVMGetUndef(ctx->ac.f32); /* B, sample mask */
args.out[3] = LLVMGetUndef(ctx->ac.f32); /* A, alpha to mask */
- if (depth) {
- args.out[0] = depth;
- args.enabled_channels |= 0x1;
- }
+ unsigned format = ac_get_spi_shader_z_format(depth != NULL,
+ stencil != NULL,
+ samplemask != NULL);
+
+ if (format == V_028710_SPI_SHADER_UINT16_ABGR) {
+ assert(!depth);
+ args.compr = 1; /* COMPR flag */
+
+ if (stencil) {
+ /* Stencil should be in X[23:16]. */
+ stencil = ac_to_integer(&ctx->ac, stencil);
+ stencil = LLVMBuildShl(ctx->builder, stencil,
+ LLVMConstInt(ctx->ac.i32, 16, 0), "");
+ args.out[0] = ac_to_float(&ctx->ac, stencil);
+ args.enabled_channels |= 0x3;
+ }
+ if (samplemask) {
+ /* SampleMask should be in Y[15:0]. */
+ args.out[1] = samplemask;
+ args.enabled_channels |= 0xc;
+ }
+ } else {
+ if (depth) {
+ args.out[0] = depth;
+ args.enabled_channels |= 0x1;
+ }
- if (stencil) {
- args.out[1] = stencil;
- args.enabled_channels |= 0x2;
- }
+ if (stencil) {
+ args.out[1] = stencil;
+ args.enabled_channels |= 0x2;
+ }
- if (samplemask) {
- args.out[2] = samplemask;
- args.enabled_channels |= 0x4;
+ if (samplemask) {
+ args.out[2] = samplemask;
+ args.enabled_channels |= 0x4;
+ }
}
/* SI (except OLAND and HAINAN) has a bug that it only looks
diff --git a/src/amd/vulkan/radv_pipeline.c b/src/amd/vulkan/radv_pipeline.c
index 0146d6935e0..1ada69d92f8 100644
--- a/src/amd/vulkan/radv_pipeline.c
+++ b/src/amd/vulkan/radv_pipeline.c
@@ -46,6 +46,7 @@
#include "vk_format.h"
#include "util/debug.h"
#include "ac_exp_param.h"
+#include "ac_shader_util.h"
static void
radv_pipeline_destroy(struct radv_device *device,
@@ -2108,11 +2109,11 @@ radv_pipeline_init(struct radv_pipeline *pipeline,
if (pipeline->device->physical_device->has_rbplus)
pipeline->graphics.db_shader_control |= S_02880C_DUAL_QUAD_DISABLE(1);
- pipeline->graphics.shader_z_format =
- ps->info.fs.writes_sample_mask ? V_028710_SPI_SHADER_32_ABGR :
- ps->info.fs.writes_stencil ? V_028710_SPI_SHADER_32_GR :
- ps->info.fs.writes_z ? V_028710_SPI_SHADER_32_R :
- V_028710_SPI_SHADER_ZERO;
+ unsigned shader_z_format =
+ ac_get_spi_shader_z_format(ps->info.fs.writes_z,
+ ps->info.fs.writes_stencil,
+ ps->info.fs.writes_sample_mask);
+ pipeline->graphics.shader_z_format = shader_z_format;
calculate_vgt_gs_mode(pipeline);
calculate_vs_outinfo(pipeline);