nir: Add new instructions for INTEL_shader_integer_functions2

uctz isn't added because it will implemented in the GLSL path and the SPIR-V path using other pre-existing instructions. v2: Avoid signed integer overflow for uabs_isub(0, INT_MIN). Noticed by Caio. v3: Alternate fix for signed integer overflow for abs_sub(0, INT_MIN). I tried the previous methon in a small test program with -ftrapv, and it failed. Reviewed-by: Caio Marcelo de Oliveira Filho <[email protected]> [v1] Part-of: <https://gitlab.freedesktop.org/mesa/mesa/merge_requests/767>
author: Ian Romanick <[email protected]> 2018-09-11 00:13:36 -0700
committer: Marge Bot <[email protected]> 2020-01-23 00:18:57 +0000
commit: 21f0d020fe2518da008c86cb111579e7f0e636b5 (patch)
tree: 36f136e8b2125ddf08d768741e58534cbc66b87a /src/compiler
parent: cb518df775f222e34a4e724be2fa825df9388b0a (diff)
1 files changed, 17 insertions, 0 deletions
diff --git a/src/compiler/nir/nir_opcodes.py b/src/compiler/nir/nir_opcodes.py
index 86485e39508..bee7322b642 100644
--- a/src/compiler/nir/nir_opcodes.py
+++ b/src/compiler/nir/nir_opcodes.py
@@ -419,6 +419,15 @@ for (int bit = bit_size - 1; bit >= 0; bit--) {
 }
 """)
 
+unop("uclz", tuint32, """
+int bit;
+for (bit = bit_size - 1; bit >= 0; bit--) {
+   if ((src0 & (1u << bit)) != 0)
+      break;
+}
+dst = (unsigned)(31 - bit);
+""")
+
 unop("ifind_msb", tint32, """
 dst = -1;
 for (int bit = 31; bit >= 0; bit--) {
@@ -586,6 +595,11 @@ if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
 }
 """)
 binop("isub", tint, "", "src0 - src1")
+binop_convert("uabs_isub", tuint, tint, "", """
+              src1 > src0 ? (uint64_t) src1 - (uint64_t) src0
+                          : (uint64_t) src0 - (uint64_t) src1
+""")
+binop("uabs_usub", tuint, "", "(src1 > src0) ? (src1 - src0) : (src0 - src1)")
 
 binop("fmul", tfloat, _2src_commutative + associative, """
 if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
@@ -653,6 +667,9 @@ uint64_t mask = (1 << (bit_size / 2)) - 1;
 dst = ((uint64_t)src0 & mask) * ((uint64_t)src1 & mask);
 """)
 
+# Multiply 32-bits with low 16-bits.
+binop("imul_32x16", tint32, "", "src0 * (int16_t) src1")
+binop("umul_32x16", tuint32, "", "src0 * (uint16_t) src1")
 
 binop("fdiv", tfloat, "", "src0 / src1")
 binop("idiv", tint, "", "src1 == 0 ? 0 : (src0 / src1)")
author	Ian Romanick <[email protected]>	2018-09-11 00:13:36 -0700
committer	Marge Bot <[email protected]>	2020-01-23 00:18:57 +0000
commit	21f0d020fe2518da008c86cb111579e7f0e636b5 (patch)
tree	36f136e8b2125ddf08d768741e58534cbc66b87a /src/compiler
parent	cb518df775f222e34a4e724be2fa825df9388b0a (diff)