diff options
author | Rhys Perry <[email protected]> | 2020-04-06 11:15:00 +0100 |
---|---|---|
committer | Rhys Perry <[email protected]> | 2020-04-24 20:03:59 +0100 |
commit | eeccb1a941e258190b5ba7a425f65599873f92ed (patch) | |
tree | 6247f079bd9ee76ea35a352f82bd658cb5176541 /src | |
parent | bcd9467d5cc11709d8c6fcbbcebd90f7e5255533 (diff) |
aco: lower 8/16-bit integer arithmetic
dEQP-VK.spirv_assembly.type.* passes with the features and extensions
enabled.
Signed-off-by: Rhys Perry <[email protected]>
Reviewed-by: Daniel Schürmann <[email protected]>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/4707>
Diffstat (limited to 'src')
-rw-r--r-- | src/amd/compiler/aco_instruction_selection_setup.cpp | 31 |
1 files changed, 31 insertions, 0 deletions
diff --git a/src/amd/compiler/aco_instruction_selection_setup.cpp b/src/amd/compiler/aco_instruction_selection_setup.cpp
index 14d08ff7153..80280319673 100644
--- a/src/amd/compiler/aco_instruction_selection_setup.cpp
+++ b/src/amd/compiler/aco_instruction_selection_setup.cpp
@@ -1018,6 +1018,34 @@ get_io_masks(isel_context *ctx, unsigned shader_count, struct nir_shader *const
    }
 }
 
+unsigned /* yields 32 or 0; handed to nir_lower_bit_size() as its callback -- 0 presumably means "do not lower" (confirm in NIR) */
+lower_bit_size_callback(const nir_alu_instr *alu, void *_) /* the second argument is never read */
+{
+   if (nir_op_is_vec(alu->op)) /* ops for which nir_op_is_vec() holds are skipped */
+      return 0;
+
+   unsigned bit_size = alu->dest.dest.ssa.bit_size; /* start from the destination's bit size */
+   if (nir_alu_instr_is_comparison(alu)) /* for comparisons, judge by the first source's bit size instead */
+      bit_size = nir_src_bit_size(alu->src[0].src);
+
+   if (bit_size >= 32 || bit_size == 1) /* only sizes below 32, other than 1, continue past this point */
+      return 0;
+
+   if (alu->op == nir_op_bcsel) /* bcsel is skipped as well */
+      return 0;
+
+   const nir_op_info *info = &nir_op_infos[alu->op];
+
+   if (info->is_conversion) /* conversion ops are skipped */
+      return 0;
+
+   bool is_integer = info->output_type & (nir_type_uint | nir_type_int); /* the output type must carry the int or uint bit ... */
+   for (unsigned i = 0; is_integer && (i < info->num_inputs); i++) /* ... and so must every input; the loop stops at the first one that does not */
+      is_integer = info->input_types[i] & (nir_type_uint | nir_type_int);
+
+   return is_integer ? 32 : 0; /* all-integer ops report 32, everything else 0 */
+}
+
 void
 setup_nir(isel_context *ctx, nir_shader *nir)
 {
@@ -1062,6 +1090,9 @@ setup_nir(isel_context *ctx, nir_shader *nir)
    // TODO: implement logic64 in aco, it's more effective for sgprs
    nir_lower_int64(nir, nir->options->lower_int64_options);
 
+   if (nir_lower_bit_size(nir, lower_bit_size_callback, NULL))
+      nir_copy_prop(nir); /* allow nir_opt_idiv_const() to optimize lowered divisions */
+
    nir_opt_idiv_const(nir, 32);
    nir_lower_idiv(nir, nir_lower_idiv_precise);
 
|