diff options
author | Vincent Lejeune <[email protected]> | 2012-09-17 22:20:18 +0200 |
---|---|---|
committer | Vincent Lejeune <[email protected]> | 2012-09-18 18:00:20 +0200 |
commit | 175fdd7b86cce4e1fc945058fa2223b77edbf8a6 (patch) | |
tree | b5346a727226a4fb8138a49e2e843b85cf3d2434 | |
parent | 12c4526157ab029fd8c0b402d190cf5f7723b555 (diff) |
radeon/llvm: Add a fdiv pattern.
Reviewed-by: Tom Stellard <thomas.stellard at amd.com>
-rw-r--r-- | src/gallium/drivers/radeon/R600Instructions.td | 13 |
1 files changed, 10 insertions, 3 deletions
diff --git a/src/gallium/drivers/radeon/R600Instructions.td b/src/gallium/drivers/radeon/R600Instructions.td index 8d2f137434c..e2f8d338cc3 100644 --- a/src/gallium/drivers/radeon/R600Instructions.td +++ b/src/gallium/drivers/radeon/R600Instructions.td @@ -702,11 +702,18 @@ class COS_Common <bits<32> inst> : R600_1OP < // Helper patterns for complex intrinsics //===----------------------------------------------------------------------===// -class DIV_Common <InstR600 recip_ieee> : Pat< +multiclass DIV_Common <InstR600 recip_ieee> { +def : Pat< (int_AMDGPU_div R600_Reg32:$src0, R600_Reg32:$src1), (MUL R600_Reg32:$src0, (recip_ieee R600_Reg32:$src1)) >; +def : Pat< + (fdiv R600_Reg32:$src0, R600_Reg32:$src1), + (MUL R600_Reg32:$src0, (recip_ieee R600_Reg32:$src1)) +>; +} + class SSG_Common <InstR600 cndgt, InstR600 cndge> : Pat < (int_AMDGPU_ssg R600_Reg32:$src), (cndgt R600_Reg32:$src, (f32 ONE), (cndge R600_Reg32:$src, (f32 ZERO), (f32 NEG_ONE))) @@ -753,7 +760,7 @@ let Predicates = [isR600] in { def MULHI_UINT_r600 : MULHI_UINT_Common<0x76>; def RECIP_UINT_r600 : RECIP_UINT_Common <0x78>; - def DIV_r600 : DIV_Common<RECIP_IEEE_r600>; + defm DIV_r600 : DIV_Common<RECIP_IEEE_r600>; def POW_r600 : POW_Common<LOG_IEEE_r600, EXP_IEEE_r600, MUL, GPRF32>; def SSG_r600 : SSG_Common<CNDGT_r600, CNDGE_r600>; def TGSI_LIT_Z_r600 : TGSI_LIT_Z_Common<MUL_LIT_r600, LOG_CLAMPED_r600, EXP_IEEE_r600>; @@ -849,7 +856,7 @@ let Predicates = [isEGorCayman] in { def : DOT4_Pat <DOT4_eg>; defm CUBE_eg : CUBE_Common<0xC0>; - def DIV_eg : DIV_Common<RECIP_IEEE_eg>; + defm DIV_eg : DIV_Common<RECIP_IEEE_eg>; def POW_eg : POW_Common<LOG_IEEE_eg, EXP_IEEE_eg, MUL, GPRF32>; def SSG_eg : SSG_Common<CNDGT_eg, CNDGE_eg>; def TGSI_LIT_Z_eg : TGSI_LIT_Z_Common<MUL_LIT_eg, LOG_CLAMPED_eg, EXP_IEEE_eg>; |