diff options
author | Rob Clark <[email protected]> | 2019-08-02 14:07:47 -0700 |
---|---|---|
committer | Rob Clark <[email protected]> | 2019-08-13 08:11:26 -0700 |
commit | 882d53d8e36592a39cde947e890969a81b2b1226 (patch) | |
tree | 83dda78788887d601ad1d23e7eca50914af9f8e3 /src/freedreno/ir3/ir3_ra.c | |
parent | 4b82d1bbb723e77f278d9348e8437cf12811e0ca (diff) |
freedreno/ir3+a6xx: same VBO state for draw/binning
Worth ~+20% on gl_driver2
Signed-off-by: Rob Clark <[email protected]>
Diffstat (limited to 'src/freedreno/ir3/ir3_ra.c')
-rw-r--r-- | src/freedreno/ir3/ir3_ra.c | 91 |
1 files changed, 88 insertions, 3 deletions
diff --git a/src/freedreno/ir3/ir3_ra.c b/src/freedreno/ir3/ir3_ra.c index 980cd62c48b..a641661a441 100644 --- a/src/freedreno/ir3/ir3_ra.c +++ b/src/freedreno/ir3/ir3_ra.c @@ -330,6 +330,7 @@ struct ir3_ra_instr_data { /* register-assign context, per-shader */ struct ir3_ra_ctx { + struct ir3_shader_variant *v; struct ir3 *ir; struct ir3_ra_reg_set *set; @@ -1091,6 +1092,60 @@ ra_block_alloc(struct ir3_ra_ctx *ctx, struct ir3_block *block) static int ra_alloc(struct ir3_ra_ctx *ctx) { + /* Pre-assign VS inputs on a6xx+ binning pass shader, to align + * with draw pass VS, so binning and draw pass can both use the + * same VBO state. + * + * Note that VS inputs are expected to be full precision. + */ + bool pre_assign_inputs = (ctx->ir->compiler->gpu_id >= 600) && + (ctx->ir->type == MESA_SHADER_VERTEX) && + ctx->v->binning_pass; + + if (pre_assign_inputs) { + for (unsigned i = 0; i < ctx->ir->ninputs; i++) { + struct ir3_instruction *instr = ctx->ir->inputs[i]; + + if (!instr) + continue; + + debug_assert(!(instr->regs[0]->flags & (IR3_REG_HALF | IR3_REG_HIGH))); + + struct ir3_ra_instr_data *id = &ctx->instrd[instr->ip]; + + /* only consider the first component: */ + if (id->off > 0) + continue; + + unsigned name = ra_name(ctx, id); + + unsigned n = i / 4; + unsigned c = i % 4; + + /* 'base' is in scalar (class 0) but we need to map that + * the conflicting register of the appropriate class (ie. + * input could be vec2/vec3/etc) + * + * Note that the higher class (larger than scalar) regs + * are setup to conflict with others in the same class, + * so for example, R1 (scalar) is also the first component + * of D1 (vec2/double): + * + * Single (base) | Double + * --------------+--------------- + * R0 | D0 + * R1 | D0 D1 + * R2 | D1 D2 + * R3 | D2 + * .. and so on.. + */ + unsigned reg = ctx->set->gpr_to_ra_reg[id->cls] + [ctx->v->nonbinning->inputs[n].regid + c]; + + ra_set_node_reg(ctx->g, name, reg); + } + } + /* pre-assign array elements: */ list_for_each_entry (struct ir3_array, arr, &ctx->ir->array_list, node) { @@ -1118,6 +1173,35 @@ retry: } } + /* also need to not conflict with any pre-assigned inputs: */ + if (pre_assign_inputs) { + for (unsigned i = 0; i < ctx->ir->ninputs; i++) { + struct ir3_instruction *instr = ctx->ir->inputs[i]; + + if (!instr) + continue; + + struct ir3_ra_instr_data *id = &ctx->instrd[instr->ip]; + + /* only consider the first component: */ + if (id->off > 0) + continue; + + unsigned name = ra_name(ctx, id); + + /* Check if array intersects with liverange AND register + * range of the input: + */ + if (intersects(arr->start_ip, arr->end_ip, + ctx->def[name], ctx->use[name]) && + intersects(base, base + arr->length, + i, i + class_sizes[id->cls])) { + base = MAX2(base, i + class_sizes[id->cls]); + goto retry; + } + } + } + arr->reg = base; for (unsigned i = 0; i < arr->length; i++) { @@ -1140,11 +1224,12 @@ retry: return 0; } -int ir3_ra(struct ir3 *ir) +int ir3_ra(struct ir3_shader_variant *v) { struct ir3_ra_ctx ctx = { - .ir = ir, - .set = ir->compiler->set, + .v = v, + .ir = v->ir, + .set = v->ir->compiler->set, }; int ret; |