diff options
author | Eric Anholt <[email protected]> | 2018-08-01 16:37:08 -0700 |
---|---|---|
committer | Eric Anholt <[email protected]> | 2018-08-06 13:03:23 -0700 |
commit | ccbe33af5b086f4b488ac7ca8a8a45ebc9ac189c (patch) | |
tree | f66e3ad497a91b02227a939920c8ea23b6ca8c53 | |
parent | f9d54dc3cf45ba6f15f74627b8ec527975ce5297 (diff) |
v3d: Make sure we don't emit a thrsw before the last one finished.
Found while forcing some spilling, which creates a lot of short
tmua->thrsw->ldtmu sequences.
Cc: "18.2" <[email protected]>
-rw-r--r-- | src/broadcom/compiler/qpu_schedule.c | 15 |
1 files changed, 13 insertions, 2 deletions
diff --git a/src/broadcom/compiler/qpu_schedule.c b/src/broadcom/compiler/qpu_schedule.c index fb5ecd6410c..4f3b621fd29 100644 --- a/src/broadcom/compiler/qpu_schedule.c +++ b/src/broadcom/compiler/qpu_schedule.c @@ -462,6 +462,7 @@ struct choose_scoreboard { int last_magic_sfu_write_tick; int last_ldvary_tick; int last_uniforms_reset_tick; + int last_thrsw_tick; bool tlb_locked; }; @@ -1095,10 +1096,16 @@ qpu_instruction_valid_in_thrend_slot(struct v3d_compile *c, } static bool -valid_thrsw_sequence(struct v3d_compile *c, +valid_thrsw_sequence(struct v3d_compile *c, struct choose_scoreboard *scoreboard, struct qinst *qinst, int instructions_in_sequence, bool is_thrend) { + /* No emitting our thrsw while the previous thrsw hasn't happened yet. */ + if (scoreboard->last_thrsw_tick + 3 > + scoreboard->tick - instructions_in_sequence) { + return false; + } + for (int slot = 0; slot < instructions_in_sequence; slot++) { /* No scheduling SFU when the result would land in the other * thread. The simulator complains for safety, though it @@ -1159,7 +1166,8 @@ emit_thrsw(struct v3d_compile *c, if (!v3d_qpu_sig_pack(c->devinfo, &sig, &packed_sig)) break; - if (!valid_thrsw_sequence(c, prev_inst, slots_filled + 1, + if (!valid_thrsw_sequence(c, scoreboard, + prev_inst, slots_filled + 1, is_thrend)) { break; } @@ -1173,7 +1181,9 @@ emit_thrsw(struct v3d_compile *c, if (merge_inst) { merge_inst->qpu.sig.thrsw = true; needs_free = true; + scoreboard->last_thrsw_tick = scoreboard->tick - slots_filled; } else { + scoreboard->last_thrsw_tick = scoreboard->tick; insert_scheduled_instruction(c, block, scoreboard, inst); time++; slots_filled++; @@ -1475,6 +1485,7 @@ v3d_qpu_schedule_instructions(struct v3d_compile *c) scoreboard.last_ldvary_tick = -10; scoreboard.last_magic_sfu_write_tick = -10; scoreboard.last_uniforms_reset_tick = -10; + scoreboard.last_thrsw_tick = -10; if (debug) { fprintf(stderr, "Pre-schedule instructions\n"); |