summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Eric Anholt <[email protected]> 2016-07-08 16:23:38 -0700
committer Eric Anholt <[email protected]> 2016-07-13 23:54:15 -0700
commit ee69cfd11d34e6570c579c42f9cd8b5c8ea36bcf (patch)
tree 5a8a817d69a9ca12e870dc89453ff988bedd550c
parent 4e797bd98f3aaea8d295c661f7501053156d211a (diff)
vc4: Convert vc4_opt_dead_code to work in the presence of control flow.
With control flow, we can't be sure that we'll see the uses of a variable before its def as we walk backwards. Given that NIR is eliminating our long chains of dead code, a simple solution for now seems fine.

This slightly changes the order of some optimizations, and so an opt_vpm happens before opt_dce, causing 3 dead MOVs to be turned into dead FMAXes in Minecraft:

instructions in affected programs: 52 -> 54 (3.85%)
-rw-r--r-- src/gallium/drivers/vc4/vc4_opt_dead_code.c 47
1 files changed, 29 insertions, 18 deletions
diff --git a/src/gallium/drivers/vc4/vc4_opt_dead_code.c b/src/gallium/drivers/vc4/vc4_opt_dead_code.c
index 26fa3ed5435..f516d388429 100644
--- a/src/gallium/drivers/vc4/vc4_opt_dead_code.c
+++ b/src/gallium/drivers/vc4/vc4_opt_dead_code.c
@@ -24,11 +24,15 @@
/**
* @file vc4_opt_dead_code.c
*
- * This is a simmple dead code eliminator for QIR with no control flow.
+ * This is a simple dead code eliminator for SSA values in QIR.
*
- * It walks from the bottom of the instruction list, removing instructions
- * with a destination that is never used, and marking the sources of non-dead
- * instructions as used.
+ * It walks all the instructions finding what temps are used, then walks again
+ * to remove instructions writing unused temps.
+ *
+ * This is an inefficient implementation if you have long chains of
+ * instructions where the entire chain is dead, but we expect those to have
+ * been eliminated at the NIR level, and here we're just cleaning up small
+ * problems produced by NIR->QIR.
*/
#include "vc4_qir.h"
@@ -83,15 +87,27 @@ qir_opt_dead_code(struct vc4_compile *c)
bool progress = false;
bool *used = calloc(c->num_temps, sizeof(bool));
- list_for_each_entry_safe_rev(struct qinst, inst,
- &c->cur_block->instructions,
- link) {
- if ((inst->dst.file == QFILE_NULL ||
- (inst->dst.file == QFILE_TEMP &&
- !used[inst->dst.index])) &&
- !inst->sf &&
- !qir_has_side_effects(c, inst) &&
- !has_nonremovable_reads(c, inst)) {
+ qir_for_each_inst_inorder(inst, c) {
+ for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) {
+ if (inst->src[i].file == QFILE_TEMP)
+ used[inst->src[i].index] = true;
+ }
+ }
+
+ qir_for_each_block(block, c) {
+ qir_for_each_inst_safe(inst, block) {
+ if (inst->dst.file != QFILE_NULL &&
+ !(inst->dst.file == QFILE_TEMP &&
+ !used[inst->dst.index])) {
+ continue;
+ }
+
+ if (inst->sf ||
+ qir_has_side_effects(c, inst) ||
+ has_nonremovable_reads(c, inst)) {
+ continue;
+ }
+
for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) {
if (inst->src[i].file != QFILE_VPM)
continue;
@@ -108,11 +124,6 @@ qir_opt_dead_code(struct vc4_compile *c)
progress = true;
continue;
}
-
- for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) {
- if (inst->src[i].file == QFILE_TEMP)
- used[inst->src[i].index] = true;
- }
}
free(used);