summaryrefslogtreecommitdiffstats
path: root/src/gallium/drivers/r300/compiler
diff options
context:
space:
mode:
author: Tom Stellard <[email protected]> 2011-10-01 15:22:24 -0700
committer: Tom Stellard <[email protected]> 2011-10-02 15:21:15 -0700
commit: d64c6d2ffc086bde7a025269b80c0980f7d908f1 (patch)
tree: 1217548ef93e5e16d0562d6097ed8a331d0c0093 /src/gallium/drivers/r300/compiler
parent: 13814b0103812adbb5aba0dba4664249e8566290 (diff)
r300/compiler: Fix error in OMOD optimization
Classic compiler mistake. In the example below, the OMOD optimization was combining instructions 4 and 10, but since there was an instruction (#8) in between them that wrote to the same register as instruction 10, instruction 11 was reading the wrong value.

Example of the mistake:

Before OMOD:

4: MAD temp[0].y, temp[3]._y__, const[0]._x__, const[0]._y__;
...
8: ADD temp[2].x, temp[1].x___, -temp[4].x___;
...
10: MUL temp[2].x, const[1].y___, temp[0].y___;
11: FRC temp[5].x, temp[2].x___;

After OMOD:

4: MAD temp[2].x / 8, temp[3]._y__, const[0]._x__, const[0]._y__;
...
8: ADD temp[2].x, temp[1].x___, -temp[4].x___;
...
11: FRC temp[5].x, temp[2].x___;

https://bugs.freedesktop.org/show_bug.cgi?id=41367
Diffstat (limited to 'src/gallium/drivers/r300/compiler')
-rw-r--r-- src/gallium/drivers/r300/compiler/radeon_optimize.c 16
1 files changed, 16 insertions, 0 deletions
diff --git a/src/gallium/drivers/r300/compiler/radeon_optimize.c b/src/gallium/drivers/r300/compiler/radeon_optimize.c
index b7a0e20797c..2d799a6547a 100644
--- a/src/gallium/drivers/r300/compiler/radeon_optimize.c
+++ b/src/gallium/drivers/r300/compiler/radeon_optimize.c
@@ -681,6 +681,20 @@ static void omod_filter_reader_cb(
}
}
+static void omod_filter_writer_cb(
+ void * userdata,
+ struct rc_instruction * inst,
+ rc_register_file file,
+ unsigned int index,
+ unsigned int mask)
+{
+ struct peephole_mul_cb_data * d = userdata;
+ if (file == d->Writer->File && index == d->Writer->Index &&
+ (mask & d->Writer->WriteMask)) {
+ d->Clobbered = 1;
+ }
+}
+
static int peephole_mul_omod(
struct radeon_compiler * c,
struct rc_instruction * inst_mul,
@@ -788,6 +802,8 @@ static int peephole_mul_omod(
inst = inst->Prev) {
rc_for_all_reads_mask(inst, omod_filter_reader_cb,
&cb_data);
+ rc_for_all_writes_mask(inst, omod_filter_writer_cb,
+ &cb_data);
if (cb_data.Clobbered) {
break;
}