summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Francisco Jerez <[email protected]> 2016-09-01 19:47:56 -0700
committer Francisco Jerez <[email protected]> 2016-09-14 14:50:57 -0700
commit 645261c4b2a12b5724946f9f6d35f74e28ce760f (patch)
tree 84f3a5d353acaa30e5d7c3421b8cf33ffe9e709c
parent 1c67e272475f576c8ab4b2be367f4c3c664cb23c (diff)
i965/fs: Change region_contained_in() to use byte units.
This makes the function less annoying to use and more accurate: we shouldn't propagate a copy into a register region that wasn't fully contained in the destination of the copy (in other words, a source region that wasn't fully defined by the copy) just because the number of registers written and read by each instruction happened to get rounded up to the same GRF multiple.
Reviewed-by: Iago Toral Quiroga <[email protected]>
-rw-r--r-- src/mesa/drivers/dri/i965/brw_fs_copy_propagation.cpp 25
1 file changed, 10 insertions, 15 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_fs_copy_propagation.cpp b/src/mesa/drivers/dri/i965/brw_fs_copy_propagation.cpp
index 0da5f13014f..80ad4b4adc6 100644
--- a/src/mesa/drivers/dri/i965/brw_fs_copy_propagation.cpp
+++ b/src/mesa/drivers/dri/i965/brw_fs_copy_propagation.cpp
@@ -333,18 +333,17 @@ can_take_stride(fs_inst *inst, unsigned arg, unsigned stride,
}
/**
- * Check that the register region read by src [src.reg_offset,
- * src.reg_offset + regs_read] is contained inside the register
- * region written by dst [dst.reg_offset, dst.reg_offset + regs_written]
- * Both src and dst must have the same register number and file.
+ * Check that the register region read by src [src.offset,
+ * src.offset + size_read[ is fully contained inside the register
+ * region written by dst [dst.offset, dst.offset + size_written[.
*/
static inline bool
-region_contained_in(const fs_reg &src, unsigned regs_read,
- const fs_reg &dst, unsigned regs_written)
+region_contained_in(const fs_reg &src, unsigned size_read,
+ const fs_reg &dst, unsigned size_written)
{
return src.file == dst.file && src.nr == dst.nr &&
src.offset >= dst.offset &&
- src.offset / REG_SIZE + regs_read <= dst.offset / REG_SIZE + regs_written;
+ src.offset + size_read <= dst.offset + size_written;
}
bool
@@ -369,10 +368,8 @@ fs_visitor::try_copy_propagate(fs_inst *inst, int arg, acp_entry *entry)
/* Bail if inst is reading a range that isn't contained in the range
* that entry is writing.
*/
- if (!region_contained_in(inst->src[arg], DIV_ROUND_UP(inst->size_read(arg),
- REG_SIZE),
- entry->dst, DIV_ROUND_UP(entry->size_written,
- REG_SIZE)))
+ if (!region_contained_in(inst->src[arg], inst->size_read(arg),
+ entry->dst, entry->size_written))
return false;
/* we can't generally copy-propagate UD negations because we
@@ -527,10 +524,8 @@ fs_visitor::try_constant_propagate(fs_inst *inst, acp_entry *entry)
/* Bail if inst is reading a range that isn't contained in the range
* that entry is writing.
*/
- if (!region_contained_in(inst->src[i], DIV_ROUND_UP(inst->size_read(i),
- REG_SIZE),
- entry->dst, DIV_ROUND_UP(entry->size_written,
- REG_SIZE)))
+ if (!region_contained_in(inst->src[i], inst->size_read(i),
+ entry->dst, entry->size_written))
continue;
/* If the type sizes don't match each channel of the instruction is