diff options
Diffstat (limited to 'src/intel')
-rw-r--r-- | src/intel/compiler/brw_fs_cmod_propagation.cpp | 10 |
1 files changed, 9 insertions, 1 deletions
diff --git a/src/intel/compiler/brw_fs_cmod_propagation.cpp b/src/intel/compiler/brw_fs_cmod_propagation.cpp index 5b74f267359..5fb522f810f 100644 --- a/src/intel/compiler/brw_fs_cmod_propagation.cpp +++ b/src/intel/compiler/brw_fs_cmod_propagation.cpp @@ -211,9 +211,17 @@ opt_cmod_propagation_local(const gen_device_info *devinfo, bblock_t *block) /* A CMP with a second source of zero can match with anything. A CMP * with a second source that is not zero can only match with an ADD * instruction. + * + * Only apply this optimization to floating-point sources. It can fail for + * integers. For inputs a = 0x80000000, b = 4, int(0x80000000) < 4, but + * int(0x80000000) - 4 overflows and results in 0x7ffffffc. That's not + * less than zero, so the flags get set differently than for (a < b). */ if (inst->opcode == BRW_OPCODE_CMP && !inst->src[1].is_zero()) { - progress = cmod_propagate_cmp_to_add(devinfo, block, inst) || progress; + if (brw_reg_type_is_floating_point(inst->src[0].type) && + cmod_propagate_cmp_to_add(devinfo, block, inst)) + progress = true; + continue; } |