summaryrefslogtreecommitdiffstats
path: root/src/intel/compiler/brw_compiler.c
diff options
context:
space:
mode:
authorSagar Ghuge <[email protected]>2019-02-14 23:08:39 -0800
committerSagar Ghuge <[email protected]>2019-03-04 15:50:25 -0800
commite551040c602d392019e68f54d9a3a310d2a937a3 (patch)
treed36046c91c6f69f2a8b9fd561add2b1cc9e820b2 /src/intel/compiler/brw_compiler.c
parent1d363d440f261fbadc1db3c17acc514b7130d505 (diff)
nir/glsl: Add another way of doing lower_imul64 for gen8+
On Gen 8 and 9, the "mul" instruction supports a 64-bit destination type. We can reduce our 64x64 int multiplication from 4 instructions to 3. Also, instead of emitting two mul instructions, we can emit a single mul instruction and extract the low/high 32 bits from the 64-bit result for [i/u]mulExtended. v2: 1) Allow lower_mul_high64 to use new opcode (Jason Ekstrand) 2) Add lower_mul_2x32_64 flag (Matt Turner) 3) Remove associative property as bit size is different (Connor Abbott) v3: Fix indentation and variable naming convention (Jason Ekstrand) Signed-off-by: Sagar Ghuge <[email protected]> Reviewed-by: Jason Ekstrand <[email protected]>
Diffstat (limited to 'src/intel/compiler/brw_compiler.c')
-rw-r--r--src/intel/compiler/brw_compiler.c7
1 files changed, 7 insertions, 0 deletions
diff --git a/src/intel/compiler/brw_compiler.c b/src/intel/compiler/brw_compiler.c
index b3df0d9fa23..28793b1f0e6 100644
--- a/src/intel/compiler/brw_compiler.c
+++ b/src/intel/compiler/brw_compiler.c
@@ -171,6 +171,13 @@ brw_compiler_create(void *mem_ctx, const struct gen_device_info *devinfo)
fp64_options |= nir_lower_fp64_full_software;
}
+ /* The Bspec's section titled "Instruction_multiply[DevBDW+]" claims that
+ * the destination type can be Quadword and the source type Doubleword for
+ * Gen8 and Gen9. So, lower the 64-bit multiply instruction on the rest of
+ * the platforms.
+ */
+ if (devinfo->gen < 8 || devinfo->gen > 9)
+ int64_options |= nir_lower_imul_2x32_64;
+
/* We want the GLSL compiler to emit code that uses condition codes */
for (int i = 0; i < MESA_SHADER_STAGES; i++) {
compiler->glsl_compiler_options[i].MaxUnrollIterations = 0;