aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--src/panfrost/bifrost/bi_pack.c21
-rw-r--r--src/panfrost/bifrost/bi_tables.c12
-rw-r--r--src/panfrost/bifrost/compiler.h5
3 files changed, 28 insertions, 10 deletions
diff --git a/src/panfrost/bifrost/bi_pack.c b/src/panfrost/bifrost/bi_pack.c
index 377990f83be..65218b23010 100644
--- a/src/panfrost/bifrost/bi_pack.c
+++ b/src/panfrost/bifrost/bi_pack.c
@@ -110,15 +110,28 @@ bi_assign_ports(bi_bundle now, bi_bundle prev)
{
struct bi_registers regs = { 0 };
+ /* We assign ports for the main register mechanism. Special ops
+ * use the data registers, which has its own mechanism entirely
+ * and thus gets skipped over here. */
+
+ unsigned read_dreg = now.add &&
+ bi_class_props[now.add->type] & BI_DATA_REG_SRC;
+
+ unsigned write_dreg = prev.add &&
+ bi_class_props[prev.add->type] & BI_DATA_REG_DEST;
+
/* First, assign reads */
if (now.fma)
bi_foreach_src(now.fma, src)
bi_assign_port_read(&regs, now.fma->src[src]);
- if (now.add)
- bi_foreach_src(now.add, src)
- bi_assign_port_read(&regs, now.add->src[src]);
+ if (now.add) {
+ bi_foreach_src(now.add, src) {
+ if (!(src == 0 && read_dreg))
+ bi_assign_port_read(&regs, now.add->src[src]);
+ }
+ }
/* Next, assign writes */
@@ -127,7 +140,7 @@ bi_assign_ports(bi_bundle now, bi_bundle prev)
regs.write_fma = true;
}
- if (prev.add && prev.add->dest & BIR_INDEX_REGISTER) {
+ if (prev.add && prev.add->dest & BIR_INDEX_REGISTER && !write_dreg) {
unsigned r = prev.add->dest & ~BIR_INDEX_REGISTER;
if (regs.write_fma) {
diff --git a/src/panfrost/bifrost/bi_tables.c b/src/panfrost/bifrost/bi_tables.c
index a0734e10ec9..07dde05e027 100644
--- a/src/panfrost/bifrost/bi_tables.c
+++ b/src/panfrost/bifrost/bi_tables.c
@@ -39,16 +39,16 @@ unsigned bi_class_props[BI_NUM_CLASSES] = {
[BI_FMA] = BI_ROUNDMODE | BI_SCHED_FMA,
[BI_FREXP] = BI_SCHED_ALL,
[BI_ISUB] = BI_GENERIC | BI_SCHED_ALL,
- [BI_LOAD] = BI_SCHED_HI_LATENCY | BI_VECTOR,
- [BI_LOAD_UNIFORM] = BI_SCHED_HI_LATENCY | BI_VECTOR,
- [BI_LOAD_ATTR] = BI_SCHED_HI_LATENCY | BI_VECTOR,
- [BI_LOAD_VAR] = BI_SCHED_HI_LATENCY | BI_VECTOR,
+ [BI_LOAD] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_DEST,
+ [BI_LOAD_UNIFORM] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_DEST,
+ [BI_LOAD_ATTR] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_DEST,
+ [BI_LOAD_VAR] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_DEST,
[BI_LOAD_VAR_ADDRESS] = BI_SCHED_HI_LATENCY,
[BI_MINMAX] = BI_GENERIC | BI_SCHED_ALL,
[BI_MOV] = BI_MODS | BI_SCHED_ALL,
[BI_SHIFT] = BI_SCHED_ALL,
- [BI_STORE] = BI_SCHED_HI_LATENCY | BI_VECTOR,
- [BI_STORE_VAR] = BI_SCHED_HI_LATENCY | BI_VECTOR,
+ [BI_STORE] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_SRC,
+ [BI_STORE_VAR] = BI_SCHED_HI_LATENCY | BI_VECTOR | BI_DATA_REG_SRC,
[BI_SPECIAL] = BI_SCHED_ADD | BI_SCHED_SLOW,
[BI_SWIZZLE] = BI_SCHED_ALL | BI_SWIZZLABLE,
[BI_TEX] = BI_SCHED_HI_LATENCY | BI_VECTOR,
diff --git a/src/panfrost/bifrost/compiler.h b/src/panfrost/bifrost/compiler.h
index b69c0fee5e7..2d3633502ec 100644
--- a/src/panfrost/bifrost/compiler.h
+++ b/src/panfrost/bifrost/compiler.h
@@ -113,6 +113,11 @@ extern unsigned bi_class_props[BI_NUM_CLASSES];
/* Intrinsic is vectorized and should read 4 components regardless of writemask */
#define BI_VECTOR (1 << 8)
+/* Use a data register for src0/dest respectively, bypassing the usual
+ * register accessor. Mutually exclusive. */
+#define BI_DATA_REG_SRC (1 << 9)
+#define BI_DATA_REG_DEST (1 << 10)
+
/* It can't get any worse than csel4... can it? */
#define BIR_SRC_COUNT 4