diff options
author | Eric Anholt <[email protected]> | 2016-07-08 16:23:38 -0700 |
---|---|---|
committer | Eric Anholt <[email protected]> | 2016-07-13 23:54:15 -0700 |
commit | ee69cfd11d34e6570c579c42f9cd8b5c8ea36bcf (patch) | |
tree | 5a8a817d69a9ca12e870dc89453ff988bedd550c | |
parent | 4e797bd98f3aaea8d295c661f7501053156d211a (diff) |
vc4: Convert vc4_opt_dead_code to work in the presence of control flow.
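With control flow, we can't be sure that we'll see all the uses of a variable
before its def as we walk backwards through the instructions. Given that NIR
is already eliminating our long chains of dead code, a simple two-pass
solution (mark every temp that is read, then remove the instructions writing
unread temps) seems fine for now.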
This slightly changes the order of some optimizations, so an opt_vpm now
happens before opt_dce, causing 3 dead MOVs to be turned into dead FMAXes
in Minecraft:
instructions in affected programs: 52 -> 54 (3.85%)
-rw-r--r-- | src/gallium/drivers/vc4/vc4_opt_dead_code.c | 47 |
1 files changed, 29 insertions, 18 deletions
diff --git a/src/gallium/drivers/vc4/vc4_opt_dead_code.c b/src/gallium/drivers/vc4/vc4_opt_dead_code.c index 26fa3ed5435..f516d388429 100644 --- a/src/gallium/drivers/vc4/vc4_opt_dead_code.c +++ b/src/gallium/drivers/vc4/vc4_opt_dead_code.c @@ -24,11 +24,15 @@ /** * @file vc4_opt_dead_code.c * - * This is a simmple dead code eliminator for QIR with no control flow. + * This is a simple dead code eliminator for SSA values in QIR. * - * It walks from the bottom of the instruction list, removing instructions - * with a destination that is never used, and marking the sources of non-dead - * instructions as used. + * It walks all the instructions finding what temps are used, then walks again + * to remove instructions writing unused temps. + * + * This is an inefficient implementation if you have long chains of + * instructions where the entire chain is dead, but we expect those to have + * been eliminated at the NIR level, and here we're just cleaning up small + * problems produced by NIR->QIR. 
*/ #include "vc4_qir.h" @@ -83,15 +87,27 @@ qir_opt_dead_code(struct vc4_compile *c) bool progress = false; bool *used = calloc(c->num_temps, sizeof(bool)); - list_for_each_entry_safe_rev(struct qinst, inst, - &c->cur_block->instructions, - link) { - if ((inst->dst.file == QFILE_NULL || - (inst->dst.file == QFILE_TEMP && - !used[inst->dst.index])) && - !inst->sf && - !qir_has_side_effects(c, inst) && - !has_nonremovable_reads(c, inst)) { + qir_for_each_inst_inorder(inst, c) { + for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) { + if (inst->src[i].file == QFILE_TEMP) + used[inst->src[i].index] = true; + } + } + + qir_for_each_block(block, c) { + qir_for_each_inst_safe(inst, block) { + if (inst->dst.file != QFILE_NULL && + !(inst->dst.file == QFILE_TEMP && + !used[inst->dst.index])) { + continue; + } + + if (inst->sf || + qir_has_side_effects(c, inst) || + has_nonremovable_reads(c, inst)) { + continue; + } + for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) { if (inst->src[i].file != QFILE_VPM) continue; @@ -108,11 +124,6 @@ qir_opt_dead_code(struct vc4_compile *c) progress = true; continue; } - - for (int i = 0; i < qir_get_op_nsrc(inst->op); i++) { - if (inst->src[i].file == QFILE_TEMP) - used[inst->src[i].index] = true; - } } free(used); |