diff options
| field | value | date |
|---|---|---|
| author | Daniel Schürmann <[email protected]> | 2019-11-20 16:53:42 +0100 |
| committer | Daniel Schürmann <[email protected]> | 2019-12-07 11:23:11 +0100 |
| commit | f895a8b1df937488e7db3e444897f6612a59048f (patch) | |
| tree | 4709972201ea9a70ef7ef47a8b09db234fb637b7 /src/amd/compiler/aco_reduce_assign.cpp | |
| parent | 9254fb4fc72ed289ffded28ef067b4582973e90c (diff) | |
aco: implement (clustered) reductions for SI/CI
Reviewed-by: Rhys Perry <[email protected]>
Diffstat (limited to 'src/amd/compiler/aco_reduce_assign.cpp')
-rw-r--r-- | src/amd/compiler/aco_reduce_assign.cpp | 2 |
1 files changed, 2 insertions, 0 deletions
```diff
diff --git a/src/amd/compiler/aco_reduce_assign.cpp b/src/amd/compiler/aco_reduce_assign.cpp
index f1015b13316..58c64cfb019 100644
--- a/src/amd/compiler/aco_reduce_assign.cpp
+++ b/src/amd/compiler/aco_reduce_assign.cpp
@@ -125,6 +125,8 @@ void setup_reduce_temp(Program* program)
             need_vtmp = true;
          if (program->chip_class >= GFX10 && op == iadd64)
             need_vtmp = true;
+         if (program->chip_class <= GFX7)
+            need_vtmp = true;
 
          need_vtmp |= cluster_size == 32;
```