summary refs log tree commit diff stats
path: root/src/gallium/drivers
diff options
context:
space:
mode:
author Eric Anholt <[email protected]> 2016-05-02 13:35:21 -0700
committer Eric Anholt <[email protected]> 2016-07-12 17:42:42 -0700
commit 420845acb2207cb9d903e67b66deaf08637ac3b2 (patch)
tree 318be1b4821563c6adf5718fac1979f02c56d147 /src/gallium/drivers
parent 0adf2ec0eefa70905fb9ca45c1681149c0688ce9 (diff)
vc4: Add support for NIR loops and break/continue.
Diffstat (limited to 'src/gallium/drivers')
-rw-r--r-- src/gallium/drivers/vc4/vc4_program.c 80
-rw-r--r-- src/gallium/drivers/vc4/vc4_qir.h 2
2 files changed, 79 insertions, 3 deletions
diff --git a/src/gallium/drivers/vc4/vc4_program.c b/src/gallium/drivers/vc4/vc4_program.c
index cb3ef6e45f3..465e052053e 100644
--- a/src/gallium/drivers/vc4/vc4_program.c
+++ b/src/gallium/drivers/vc4/vc4_program.c
@@ -1764,6 +1764,27 @@ ntq_emit_if(struct vc4_compile *c, nir_if *if_stmt)
}
static void
+ntq_emit_jump(struct vc4_compile *c, nir_jump_instr *jump) /* Emits QIR for a NIR break/continue by conditionally rewriting c->execute. */
+{
+ switch (jump->type) {
+ case nir_jump_break:
+ qir_SF(c, c->execute); /* presumably sets the condition flags from c->execute so the MOV below can test them */
+ qir_MOV_cond(c, QPU_COND_ZS, c->execute, /* under the ZS condition, overwrite c->execute ... */
+ qir_uniform_ui(c, c->loop_break_block->index)); /* ... with the index of the current loop's break block */
+ break;
+
+ case nir_jump_continue:
+ qir_SF(c, c->execute); /* same flag setup as the break case */
+ qir_MOV_cond(c, QPU_COND_ZS, c->execute, /* under the ZS condition, overwrite c->execute ... */
+ qir_uniform_ui(c, c->loop_cont_block->index)); /* ... with the index of the current loop's continue block */
+ break;
+
+ case nir_jump_return:
+ unreachable("All returns shouold be lowered\n"); /* NOTE(review): "shouold" in this message is a typo for "should" */
+ }
+}
+
+static void
ntq_emit_instr(struct vc4_compile *c, nir_instr *instr)
{
switch (instr->type) {
@@ -1787,6 +1808,10 @@ ntq_emit_instr(struct vc4_compile *c, nir_instr *instr)
ntq_emit_tex(c, nir_instr_as_tex(instr));
break;
+ case nir_instr_type_jump:
+ ntq_emit_jump(c, nir_instr_as_jump(instr));
+ break;
+
default:
fprintf(stderr, "Unknown NIR instr type: ");
nir_print_instr(instr, stderr);
@@ -1806,10 +1831,59 @@ ntq_emit_block(struct vc4_compile *c, nir_block *block)
static void ntq_emit_cf_list(struct vc4_compile *c, struct exec_list *list);
static void
-ntq_emit_loop(struct vc4_compile *c, nir_loop *nloop)
+ntq_emit_loop(struct vc4_compile *c, nir_loop *loop) /* Emits a NIR loop as a continue block holding the body plus a separate break block. */
{
- fprintf(stderr, "LOOPS not fully handled. Rendering errors likely.\n");
- ntq_emit_cf_list(c, &nloop->body);
+ if (!c->vc4->screen->has_control_flow) { /* fallback: the screen reports no control-flow support */
+ fprintf(stderr,
+ "loop support requires updated kernel.\n");
+ ntq_emit_cf_list(c, &loop->body); /* emit the body once, with no branch back */
+ return;
+ }
+
+ bool was_top_level = false; /* true when this loop is the one that created c->execute */
+ if (c->execute.file == QFILE_NULL) { /* no execute value exists yet */
+ c->execute = qir_MOV(c, qir_uniform_ui(c, 0)); /* start c->execute at 0 */
+ was_top_level = true;
+ }
+
+ struct qblock *save_loop_cont_block = c->loop_cont_block; /* remember the enclosing loop's targets ... */
+ struct qblock *save_loop_break_block = c->loop_break_block; /* ... so they can be restored at the end */
+
+ c->loop_cont_block = qir_new_block(c); /* block the loop body is emitted into */
+ c->loop_break_block = qir_new_block(c); /* block emission resumes in after the loop */
+
+ qir_link_blocks(c->cur_block, c->loop_cont_block); /* entry edge into the loop */
+ qir_set_emit_block(c, c->loop_cont_block);
+ ntq_activate_execute_for_block(c);
+
+ ntq_emit_cf_list(c, &loop->body); /* loop body; may contain nested control flow and jumps */
+
+ /* If anything had explicitly continued, or is here at the end of the
+ * loop, then we need to loop again. SF updates are masked by the
+ * instruction's condition, so we can do the OR of the two conditions
+ * within SF.
+ */
+ qir_SF(c, c->execute);
+ struct qinst *cont_check = /* c->execute minus the continue block's index, written to c->undef */
+ qir_SUB_dest(c,
+ c->undef,
+ c->execute,
+ qir_uniform_ui(c, c->loop_cont_block->index));
+ cont_check->cond = QPU_COND_ZC; /* the SUB is conditional on ZC from the SF above */
+ cont_check->sf = true; /* and it updates the flags itself */
+
+ qir_BRANCH(c, QPU_COND_BRANCH_ANY_ZS); /* conditional branch ending the loop body */
+ qir_link_blocks(c->cur_block, c->loop_cont_block); /* successor edge back to the loop top */
+ qir_link_blocks(c->cur_block, c->loop_break_block); /* successor edge out of the loop */
+
+ qir_set_emit_block(c, c->loop_break_block); /* later code is emitted into the break block */
+ if (was_top_level)
+ c->execute = c->undef; /* this loop created c->execute, so reset it to c->undef */
+ else
+ ntq_activate_execute_for_block(c);
+
+ c->loop_break_block = save_loop_break_block; /* restore the enclosing loop's targets */
+ c->loop_cont_block = save_loop_cont_block;
}
static void
diff --git a/src/gallium/drivers/vc4/vc4_qir.h b/src/gallium/drivers/vc4/vc4_qir.h
index e284ed58b65..fe85b769775 100644
--- a/src/gallium/drivers/vc4/vc4_qir.h
+++ b/src/gallium/drivers/vc4/vc4_qir.h
@@ -463,6 +463,8 @@ struct vc4_compile {
struct list_head blocks;
int next_block_index;
struct qblock *cur_block;
+ struct qblock *loop_cont_block;
+ struct qblock *loop_break_block;
struct list_head qpu_inst_list;
uint64_t *qpu_insts;