From 6318808a0559f7b2a8152592f0ae4e5ccc6953a9 Mon Sep 17 00:00:00 2001 From: Iago Toral Quiroga <itoral@igalia.com> Date: Thu, 19 Apr 2018 10:06:43 +0200 Subject: intel/compiler: fix 16-bit comparisons NIR assumes that booleans are always 32-bit, but Intel hardware produces 16-bit booleans for 16-bit comparisons. This means that we need to convert the 16-bit result to 32-bit. In the future we want to add an optimization pass to clean this up and hopefully remove the conversions. v2 (Jason): use the type of the source for the temporary and use brw_reg_type_from_bit_size for the conversion to 32-bit. Reviewed-by: Jason Ekstrand <jason@jlekstrand.net> --- src/intel/compiler/brw_fs_nir.cpp | 38 ++++++++++++++++++++++++++++++-------- 1 file changed, 30 insertions(+), 8 deletions(-) (limited to 'src/intel/compiler') diff --git a/src/intel/compiler/brw_fs_nir.cpp b/src/intel/compiler/brw_fs_nir.cpp index 5f8f7cd6a66..9c802fb7c62 100644 --- a/src/intel/compiler/brw_fs_nir.cpp +++ b/src/intel/compiler/brw_fs_nir.cpp @@ -1018,9 +1018,11 @@ fs_visitor::nir_emit_alu(const fs_builder &bld, nir_alu_instr *instr) case nir_op_feq: case nir_op_fne: { fs_reg dest = result; - if (nir_src_bit_size(instr->src[0].src) > 32) { - dest = bld.vgrf(BRW_REGISTER_TYPE_DF, 1); - } + + const uint32_t bit_size = nir_src_bit_size(instr->src[0].src); + if (bit_size != 32) + dest = bld.vgrf(op[0].type, 1); + brw_conditional_mod cond; switch (instr->op) { case nir_op_flt: @@ -1038,9 +1040,19 @@ fs_visitor::nir_emit_alu(const fs_builder &bld, nir_alu_instr *instr) default: unreachable("bad opcode"); } + bld.CMP(dest, op[0], op[1], cond); - if (nir_src_bit_size(instr->src[0].src) > 32) { + + if (bit_size > 32) { bld.MOV(result, subscript(dest, BRW_REGISTER_TYPE_UD, 0)); + } else if(bit_size < 32) { + /* When we convert the result to 32-bit we need to be careful and do + * it as a signed conversion to get sign extension (for 32-bit true) + */ + const brw_reg_type src_type = + brw_reg_type_from_bit_size(bit_size, BRW_REGISTER_TYPE_D); + + bld.MOV(retype(result, BRW_REGISTER_TYPE_D), retype(dest, src_type)); } break; } @@ -1052,9 +1064,10 @@ fs_visitor::nir_emit_alu(const fs_builder &bld, nir_alu_instr *instr) case nir_op_ieq: case nir_op_ine: { fs_reg dest = result; - if (nir_src_bit_size(instr->src[0].src) > 32) { - dest = bld.vgrf(BRW_REGISTER_TYPE_UQ, 1); - } + + const uint32_t bit_size = nir_src_bit_size(instr->src[0].src); + if (bit_size != 32) + dest = bld.vgrf(op[0].type, 1); brw_conditional_mod cond; switch (instr->op) { @@ -1076,8 +1089,17 @@ fs_visitor::nir_emit_alu(const fs_builder &bld, nir_alu_instr *instr) unreachable("bad opcode"); } bld.CMP(dest, op[0], op[1], cond); - if (nir_src_bit_size(instr->src[0].src) > 32) { + + if (bit_size > 32) { bld.MOV(result, subscript(dest, BRW_REGISTER_TYPE_UD, 0)); + } else if (bit_size < 32) { + /* When we convert the result to 32-bit we need to be careful and do + * it as a signed conversion to get sign extension (for 32-bit true) + */ + const brw_reg_type src_type = + brw_reg_type_from_bit_size(bit_size, BRW_REGISTER_TYPE_D); + + bld.MOV(retype(result, BRW_REGISTER_TYPE_D), retype(dest, src_type)); } break; } -- cgit v1.2.3