about | summary | refs | log | tree | commit | diff | stats
path: root/src/amd/compiler/aco_reduce_assign.cpp
diff options
context:
space:
mode:
author: Daniel Schürmann <[email protected]> 2019-11-20 16:53:42 +0100
committer: Daniel Schürmann <[email protected]> 2019-12-07 11:23:11 +0100
commit: f895a8b1df937488e7db3e444897f6612a59048f (patch)
tree: 4709972201ea9a70ef7ef47a8b09db234fb637b7 /src/amd/compiler/aco_reduce_assign.cpp
parent: 9254fb4fc72ed289ffded28ef067b4582973e90c (diff)
aco: implement (clustered) reductions for SI/CI
Reviewed-by: Rhys Perry <[email protected]>
Diffstat (limited to 'src/amd/compiler/aco_reduce_assign.cpp')
-rw-r--r-- src/amd/compiler/aco_reduce_assign.cpp 2
1 files changed, 2 insertions, 0 deletions
diff --git a/src/amd/compiler/aco_reduce_assign.cpp b/src/amd/compiler/aco_reduce_assign.cpp
index f1015b13316..58c64cfb019 100644
--- a/src/amd/compiler/aco_reduce_assign.cpp
+++ b/src/amd/compiler/aco_reduce_assign.cpp
@@ -125,6 +125,8 @@ void setup_reduce_temp(Program* program)
need_vtmp = true;
if (program->chip_class >= GFX10 && op == iadd64)
need_vtmp = true;
+ if (program->chip_class <= GFX7)
+ need_vtmp = true;
need_vtmp |= cluster_size == 32;