diff options
author | Jason Ekstrand <[email protected]> | 2014-08-13 12:23:47 -0700 |
---|---|---|
committer | Jason Ekstrand <[email protected]> | 2014-09-30 10:29:14 -0700 |
commit | f91b566f55390d1a0e472ac970d017374b91ee83 (patch) | |
tree | 03e15652cc5dc714ebf6c0b1ffc2f546d8263079 /src/mesa | |
parent | 1728e74957a62b1b4b9fbb62a7de2c12b77c8a75 (diff) |
i965/brw_reg: Add a firsthalf function and use it in the generator
Right now, this function is a no-op but it indicates that we intend to only
use the first half of the 16-wide register.
Signed-off-by: Jason Ekstrand <[email protected]>
Reviewed-by: Matt Turner <[email protected]>
Diffstat (limited to 'src/mesa')
-rw-r--r-- | src/mesa/drivers/dri/i965/brw_fs_generator.cpp | 67 | ||||
-rw-r--r-- | src/mesa/drivers/dri/i965/brw_reg.h | 6 |
2 files changed, 44 insertions, 29 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_fs_generator.cpp b/src/mesa/drivers/dri/i965/brw_fs_generator.cpp index 6ba9c0edf6c..122a43f9316 100644 --- a/src/mesa/drivers/dri/i965/brw_fs_generator.cpp +++ b/src/mesa/drivers/dri/i965/brw_fs_generator.cpp @@ -318,10 +318,11 @@ fs_generator::generate_math_gen6(fs_inst *inst, int op = brw_math_function(inst->opcode); bool binop = src1.file != BRW_ARCHITECTURE_REGISTER_FILE; - brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - gen6_math(p, dst, op, src0, src1); - - if (dispatch_width == 16) { + if (dispatch_width == 8) { + gen6_math(p, dst, op, src0, src1); + } else if (dispatch_width == 16) { + brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); + gen6_math(p, firsthalf(dst), op, firsthalf(src0), firsthalf(src1)); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); gen6_math(p, sechalf(dst), op, sechalf(src0), binop ? sechalf(src1) : brw_null_reg()); @@ -338,13 +339,17 @@ fs_generator::generate_math_gen4(fs_inst *inst, assert(inst->mlen >= 1); - brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - gen4_math(p, dst, - op, - inst->base_mrf, src, - BRW_MATH_PRECISION_FULL); - - if (dispatch_width == 16) { + if (dispatch_width == 8) { + gen4_math(p, dst, + op, + inst->base_mrf, src, + BRW_MATH_PRECISION_FULL); + } else if (dispatch_width == 16) { + brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); + gen4_math(p, firsthalf(dst), + op, + inst->base_mrf, firsthalf(src), + BRW_MATH_PRECISION_FULL); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); gen4_math(p, sechalf(dst), op, @@ -787,17 +792,18 @@ fs_generator::generate_ddy(fs_inst *inst, struct brw_reg dst, struct brw_reg src BRW_SWIZZLE_ZWZW, WRITEMASK_XYZW); brw_push_insn_state(p); brw_set_default_access_mode(p, BRW_ALIGN_16); - if (unroll_to_simd8) - brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - if (negate_value) - brw_ADD(p, dst, src1, negate(src0)); - else - brw_ADD(p, dst, src0, negate(src1)); if (unroll_to_simd8) { - brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); - src0 = sechalf(src0); - src1 = sechalf(src1); - dst = sechalf(dst); + brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); + if (negate_value) { + brw_ADD(p, firsthalf(dst), firsthalf(src1), negate(firsthalf(src0))); + brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); + brw_ADD(p, sechalf(dst), sechalf(src1), negate(sechalf(src0))); + } else { + brw_ADD(p, firsthalf(dst), firsthalf(src0), negate(firsthalf(src1))); + brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); + brw_ADD(p, sechalf(dst), sechalf(src0), negate(sechalf(src1))); + } + } else { if (negate_value) brw_ADD(p, dst, src1, negate(src0)); else @@ -1327,9 +1333,12 @@ fs_generator::generate_set_sample_id(fs_inst *inst, brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); brw_set_default_mask_control(p, BRW_MASK_DISABLE); struct brw_reg reg = retype(stride(src1, 1, 4, 0), BRW_REGISTER_TYPE_UW); - brw_ADD(p, dst, src0, reg); - if (dispatch_width == 16) - brw_ADD(p, offset(dst, 1), offset(src0, 1), suboffset(reg, 2)); + if (dispatch_width == 8) { + brw_ADD(p, dst, src0, reg); + } else if (dispatch_width == 16) { + brw_ADD(p, firsthalf(dst), firsthalf(src0), reg); + brw_ADD(p, sechalf(dst), sechalf(src0), suboffset(reg, 2)); + } brw_pop_insn_state(p); } @@ -1560,7 +1569,7 @@ fs_generator::generate_code(const cfg_t *cfg) brw_set_default_access_mode(p, BRW_ALIGN_16); if (dispatch_width == 16 && brw->gen < 8 && !brw->is_haswell) { brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - brw_MAD(p, dst, src[0], src[1], src[2]); + brw_MAD(p, firsthalf(dst), firsthalf(src[0]), firsthalf(src[1]), firsthalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); brw_MAD(p, sechalf(dst), sechalf(src[0]), sechalf(src[1]), sechalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_COMPRESSED); @@ -1575,7 +1584,7 @@ fs_generator::generate_code(const cfg_t *cfg) brw_set_default_access_mode(p, BRW_ALIGN_16); if (dispatch_width == 16 && brw->gen < 8 && !brw->is_haswell) { brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - brw_LRP(p, dst, src[0], src[1], src[2]); + brw_LRP(p, firsthalf(dst), firsthalf(src[0]), firsthalf(src[1]), firsthalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); brw_LRP(p, sechalf(dst), sechalf(src[0]), sechalf(src[1]), sechalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_COMPRESSED); @@ -1671,7 +1680,7 @@ fs_generator::generate_code(const cfg_t *cfg) brw_set_default_access_mode(p, BRW_ALIGN_16); if (dispatch_width == 16 && brw->gen < 8 && !brw->is_haswell) { brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - brw_BFE(p, dst, src[0], src[1], src[2]); + brw_BFE(p, firsthalf(dst), firsthalf(src[0]), firsthalf(src[1]), firsthalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); brw_BFE(p, sechalf(dst), sechalf(src[0]), sechalf(src[1]), sechalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_COMPRESSED); @@ -1690,7 +1699,7 @@ fs_generator::generate_code(const cfg_t *cfg) */ if (dispatch_width == 16 && brw->is_haswell) { brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - brw_BFI1(p, dst, src[0], src[1]); + brw_BFI1(p, firsthalf(dst), firsthalf(src[0]), firsthalf(src[1])); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); brw_BFI1(p, sechalf(dst), sechalf(src[0]), sechalf(src[1])); brw_set_default_compression_control(p, BRW_COMPRESSION_COMPRESSED); @@ -1711,7 +1720,7 @@ fs_generator::generate_code(const cfg_t *cfg) */ if (dispatch_width == 16) { brw_set_default_compression_control(p, BRW_COMPRESSION_NONE); - brw_BFI2(p, dst, src[0], src[1], src[2]); + brw_BFI2(p, firsthalf(dst), firsthalf(src[0]), firsthalf(src[1]), firsthalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_2NDHALF); brw_BFI2(p, sechalf(dst), sechalf(src[0]), sechalf(src[1]), sechalf(src[2])); brw_set_default_compression_control(p, BRW_COMPRESSION_COMPRESSED); diff --git a/src/mesa/drivers/dri/i965/brw_reg.h b/src/mesa/drivers/dri/i965/brw_reg.h index 9638c779f91..2e110d6b90d 100644 --- a/src/mesa/drivers/dri/i965/brw_reg.h +++ b/src/mesa/drivers/dri/i965/brw_reg.h @@ -371,6 +371,12 @@ retype(struct brw_reg reg, enum brw_reg_type type) } static inline struct brw_reg +firsthalf(struct brw_reg reg) +{ + return reg; +} + +static inline struct brw_reg sechalf(struct brw_reg reg) { if (reg.vstride) |