aboutsummaryrefslogtreecommitdiffstats
path: root/src/gallium/auxiliary/gallivm
diff options
context:
space:
mode:
author: Krzysztof Raszkowski <[email protected]> 2019-12-05 18:01:08 +0100
committer: Krzysztof Raszkowski <[email protected]> 2019-12-10 10:34:18 +0000
commit: cfe00a52f013dbab52a10705dfdf58b893578d11 (patch)
tree: 7db745f863c178e2d89bbdbb5075e3faf98d3732 /src/gallium/auxiliary/gallivm
parent: 008fe909cac1449cac7cc71fca4c805cc6d3de95 (diff)
gallivm: add TGSI bit arithmetic opcodes support
Add TGSI_OPCODE_BFI, TGSI_OPCODE_POPC, TGSI_OPCODE_LSB, TGSI_OPCODE_IMSB, TGSI_OPCODE_UMSB, TGSI_OPCODE_IBFE, TGSI_OPCODE_UBFE, TGSI_OPCODE_BREV support.

Reviewed-by: Dave Airlie <[email protected]>
Reviewed-by: Jan Zielinski <[email protected]>
Diffstat (limited to 'src/gallium/auxiliary/gallivm')
-rw-r--r--src/gallium/auxiliary/gallivm/lp_bld_tgsi_action.c138
1 files changed, 138 insertions, 0 deletions
diff --git a/src/gallium/auxiliary/gallivm/lp_bld_tgsi_action.c b/src/gallium/auxiliary/gallivm/lp_bld_tgsi_action.c
index ce2b927db88..7cdd87260c2 100644
--- a/src/gallium/auxiliary/gallivm/lp_bld_tgsi_action.c
+++ b/src/gallium/auxiliary/gallivm/lp_bld_tgsi_action.c
@@ -2398,6 +2398,134 @@ u64shr_emit_cpu(
emit_data->output[emit_data->chan] = lp_build_shr(uint_bld, emit_data->args[0],
masked_count);
}
+/**
+ * Emit TGSI_OPCODE_BFI (bitfield insert) for the CPU path.
+ *
+ * Operands, as used below: args[0] = base, args[1] = insert,
+ * args[2] = offset, args[3] = bits.  The result is written to
+ * emit_data->output[emit_data->chan].
+ */
+static void bfi_emit_cpu(const struct lp_build_tgsi_action *action,
+                         struct lp_build_tgsi_context *bld_base,
+                         struct lp_build_emit_data *emit_data) {
+   /*
+    * def bfi(base, insert, offset, bits):
+    *   if offset < 0 or bits < 0 or offset + bits > 32:
+    *     return undefined
+    *   # the field mask must be ~0 when bits == 32, offset == 0
+    *   mask = ((1 << bits) - 1) << offset
+    *   return ((insert << offset) & mask) | (base & ~mask)
+    */
+   struct lp_build_context *uint_bld = &bld_base->uint_bld;
+   LLVMValueRef base = emit_data->args[0];
+   LLVMValueRef insert = emit_data->args[1];
+   LLVMValueRef offset = emit_data->args[2];
+   LLVMValueRef bits = emit_data->args[3];
+
+   LLVMValueRef full_width =
+      lp_build_const_vec(uint_bld->gallivm, uint_bld->type, 32);
+   LLVMValueRef all_ones = lp_build_not(
+      uint_bld, lp_build_const_vec(uint_bld->gallivm, uint_bld->type, 0));
+
+   /* (1 << bits) - 1: the low `bits` bits set, valid for bits in [0, 31]. */
+   LLVMValueRef one_shl_bits_dec_one = lp_build_sub(
+      uint_bld, lp_build_shl(uint_bld, uint_bld->one, bits), uint_bld->one);
+
+   /*
+    * bits == 32 is a legal input (with offset == 0), but an LLVM shl by the
+    * full type width yields poison rather than 0, so "(1 << 32) - 1" cannot
+    * be relied on to produce ~0.  Pick the all-ones field explicitly for
+    * that case; the poison value in the unselected arm is then ignored.
+    * NOTE(review): assumes lp_build_shl lowers to a plain LLVM shl -- confirm.
+    */
+   LLVMValueRef bits_is_full =
+      lp_build_cmp(uint_bld, PIPE_FUNC_EQUAL, bits, full_width);
+   LLVMValueRef field =
+      lp_build_select(uint_bld, bits_is_full, all_ones, one_shl_bits_dec_one);
+
+   LLVMValueRef mask = lp_build_shl(uint_bld, field, offset);
+   LLVMValueRef insert_shl_offset = lp_build_shl(uint_bld, insert, offset);
+   LLVMValueRef insert_shl_offset_and_mask =
+      lp_build_and(uint_bld, insert_shl_offset, mask);
+   LLVMValueRef base_and_not_mask =
+      lp_build_and(uint_bld, base, lp_build_not(uint_bld, mask));
+
+   emit_data->output[emit_data->chan] =
+      lp_build_or(uint_bld, insert_shl_offset_and_mask, base_and_not_mask);
+}
+
+/**
+ * Emit TGSI_OPCODE_LSB for the CPU path.
+ *
+ * Computes the trailing-zero count of args[0]; when that count is not
+ * below 32 the result is replaced by -1.  The value is stored in
+ * emit_data->output[emit_data->chan].
+ */
+static void lsb_emit_cpu(const struct lp_build_tgsi_action *action,
+                         struct lp_build_tgsi_context *bld_base,
+                         struct lp_build_emit_data *emit_data) {
+   /* All arithmetic here goes through the signed integer build context. */
+   struct lp_build_context *int_bld = &bld_base->int_bld;
+
+   LLVMValueRef trailing_zeros = lp_build_cttz(int_bld, emit_data->args[0]);
+
+   LLVMValueRef bit_width =
+      lp_build_const_vec(int_bld->gallivm, int_bld->type, 32);
+   LLVMValueRef found_bit =
+      lp_build_cmp(int_bld, PIPE_FUNC_LESS, trailing_zeros, bit_width);
+
+   LLVMValueRef minus_one =
+      lp_build_const_vec(int_bld->gallivm, int_bld->type, -1);
+   LLVMValueRef lsb_index =
+      lp_build_select(int_bld, found_bit, trailing_zeros, minus_one);
+
+   emit_data->output[emit_data->chan] = lsb_index;
+}
+
+/**
+ * Emit TGSI_OPCODE_UMSB for the CPU path.
+ *
+ * Stores 31 - ctlz(args[0]) in emit_data->output[emit_data->chan].
+ * Also used as the final step of imsb_emit_cpu.
+ */
+static void umsb_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   /* The subtraction is done in the signed integer build context. */
+   struct lp_build_context *int_bld = &bld_base->int_bld;
+
+   LLVMValueRef top_bit_index =
+      lp_build_const_vec(int_bld->gallivm, int_bld->type, 31);
+   LLVMValueRef leading_zeros = lp_build_ctlz(int_bld, emit_data->args[0]);
+
+   emit_data->output[emit_data->chan] =
+      lp_build_sub(int_bld, top_bit_index, leading_zeros);
+}
+
+/**
+ * Emit TGSI_OPCODE_IMSB for the CPU path.
+ *
+ * Negative inputs are bitwise-inverted, non-negative inputs are left
+ * unchanged, and the result is handed to umsb_emit_cpu.  Note that
+ * emit_data->args[0] is overwritten with the adjusted value.
+ */
+static void imsb_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   struct lp_build_context *int_bld = &bld_base->int_bld;
+   LLVMValueRef value = emit_data->args[0];
+
+   LLVMValueRef zero = lp_build_const_vec(int_bld->gallivm, int_bld->type, 0);
+   LLVMValueRef is_negative =
+      lp_build_cmp(int_bld, PIPE_FUNC_LESS, value, zero);
+   LLVMValueRef inverted = lp_build_not(int_bld, value);
+
+   /* Replace the operand in place so the UMSB emitter sees the adjusted value. */
+   emit_data->args[0] = lp_build_select(int_bld, is_negative, inverted, value);
+
+   umsb_emit_cpu(action, bld_base, emit_data);
+}
+
+/**
+ * Emit TGSI_OPCODE_POPC for the CPU path: the population count of args[0]
+ * is stored in emit_data->output[emit_data->chan].
+ */
+static void popc_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   struct lp_build_context *int_bld = &bld_base->int_bld;
+   LLVMValueRef set_bits = lp_build_popcount(int_bld, emit_data->args[0]);
+
+   emit_data->output[emit_data->chan] = set_bits;
+}
+
+/**
+ * Emit TGSI_OPCODE_IBFE (signed bitfield extract) for the CPU path.
+ *
+ * Operands, as used below: args[0] = value, args[1] = offset, args[2] = bits.
+ * The result is written to emit_data->output[emit_data->chan].
+ */
+static void ibfe_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   /* Reference semantics:
+    *
+    * def ibfe(value, offset, bits):
+    *   if offset < 0 or bits < 0 or offset + bits > 32:
+    *     return undefined
+    *   if bits == 0: return 0
+    *   # Note: >> sign-extends
+    *   return (value << (32 - offset - bits)) >> (32 - bits)
+    */
+   struct lp_build_context *int_bld = &bld_base->int_bld;
+   LLVMValueRef value = emit_data->args[0];
+   LLVMValueRef offset = emit_data->args[1];
+   LLVMValueRef bits = emit_data->args[2];
+
+   LLVMValueRef bit_width =
+      lp_build_const_vec(int_bld->gallivm, int_bld->type, 32);
+   LLVMValueRef zero = lp_build_const_vec(int_bld->gallivm, int_bld->type, 0);
+
+   /* 32 - bits: how far the field is shifted back down at the end. */
+   LLVMValueRef right_shift = lp_build_sub(int_bld, bit_width, bits);
+   /* 32 - bits - offset: moves the field's top bit to bit 31. */
+   LLVMValueRef left_shift = lp_build_sub(int_bld, right_shift, offset);
+   LLVMValueRef field_at_top = lp_build_shl(int_bld, value, left_shift);
+
+   /* A zero-width field yields 0 instead of the shifted value. */
+   LLVMValueRef is_empty =
+      lp_build_cmp(int_bld, PIPE_FUNC_EQUAL, bits, zero);
+   LLVMValueRef extracted = lp_build_shr(int_bld, field_at_top, right_shift);
+
+   emit_data->output[emit_data->chan] =
+      lp_build_select(int_bld, is_empty, zero, extracted);
+}
+
+/**
+ * Emit TGSI_OPCODE_UBFE (unsigned bitfield extract) for the CPU path.
+ *
+ * Operands, as used below: args[0] = value, args[1] = offset, args[2] = bits.
+ * The result is written to emit_data->output[emit_data->chan].
+ */
+static void ubfe_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   /* def ubfe(value, offset, bits):
+    *   if offset < 0 or bits < 0 or offset + bits > 32:
+    *     return undefined
+    *   if bits == 0: return 0
+    *   # Note: >> does not sign-extend
+    *   return (value << (32 - offset - bits)) >> (32 - bits)
+    */
+   struct lp_build_context *uint_bld = &bld_base->uint_bld;
+   LLVMValueRef zero =
+      lp_build_const_vec(uint_bld->gallivm, uint_bld->type, 0);
+
+   LLVMValueRef r_32_sub_bits = lp_build_sub(
+      uint_bld, lp_build_const_vec(uint_bld->gallivm, uint_bld->type, 32),
+      emit_data->args[2]);
+   LLVMValueRef temp1 =
+      lp_build_sub(uint_bld, r_32_sub_bits, emit_data->args[1]);
+   LLVMValueRef temp2 = lp_build_shl(uint_bld, emit_data->args[0], temp1);
+
+   /*
+    * bits == 0 makes the final shift count 32, which is not a defined shift
+    * for a 32-bit LLVM value, so the "return 0" case from the reference
+    * semantics has to be selected explicitly (as ibfe_emit_cpu does).
+    */
+   LLVMValueRef cond =
+      lp_build_cmp(uint_bld, PIPE_FUNC_EQUAL, emit_data->args[2], zero);
+   emit_data->output[emit_data->chan] = lp_build_select(
+      uint_bld, cond, zero, lp_build_shr(uint_bld, temp2, r_32_sub_bits));
+}
+
+/**
+ * Emit TGSI_OPCODE_BREV for the CPU path: the bit-reversed form of args[0]
+ * is stored in emit_data->output[emit_data->chan].
+ */
+static void brev_emit_cpu(const struct lp_build_tgsi_action *action,
+                          struct lp_build_tgsi_context *bld_base,
+                          struct lp_build_emit_data *emit_data) {
+   struct lp_build_context *bld = &bld_base->uint_bld;
+   LLVMValueRef reversed =
+      lp_build_bitfield_reverse(bld, emit_data->args[0]);
+
+   emit_data->output[emit_data->chan] = reversed;
+}
void
lp_set_default_actions_cpu(
@@ -2507,4 +2635,14 @@ lp_set_default_actions_cpu(
bld_base->op_actions[TGSI_OPCODE_U64SHL].emit = u64shl_emit_cpu;
bld_base->op_actions[TGSI_OPCODE_I64SHR].emit = i64shr_emit_cpu;
bld_base->op_actions[TGSI_OPCODE_U64SHR].emit = u64shr_emit_cpu;
+
+ bld_base->op_actions[TGSI_OPCODE_BFI].emit = bfi_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_POPC].emit = popc_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_LSB].emit = lsb_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_IMSB].emit = imsb_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_UMSB].emit = umsb_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_IBFE].emit = ibfe_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_UBFE].emit = ubfe_emit_cpu;
+ bld_base->op_actions[TGSI_OPCODE_BREV].emit = brev_emit_cpu;
+
}