diff options
author | Ian Romanick <[email protected]> | 2016-12-15 14:26:24 -0800 |
---|---|---|
committer | Ian Romanick <[email protected]> | 2016-12-19 15:55:43 -0800 |
commit | d32956935edf06c8ae6872c707bc65187b4a1d15 (patch) | |
tree | d796b8c3644d6d375caea13725ffe922ba87dcaf /src/compiler/glsl | |
parent | e92935089bd9a987027d1f0791e7298bb3a57113 (diff) |
glsl: Walk a list of ir_dereference_array to mark array elements as accessed
Signed-off-by: Ian Romanick <[email protected]>
Cc: [email protected]
Reviewed-by: Kenneth Graunke <[email protected]>
Diffstat (limited to 'src/compiler/glsl')
-rw-r--r-- | src/compiler/glsl/ir_array_refcount.cpp | 73 | ||||
-rw-r--r-- | src/compiler/glsl/ir_array_refcount.h | 10 | ||||
-rw-r--r-- | src/compiler/glsl/tests/array_refcount_test.cpp | 425 |
3 files changed, 507 insertions, 1 deletions
diff --git a/src/compiler/glsl/ir_array_refcount.cpp b/src/compiler/glsl/ir_array_refcount.cpp index 7627fa13bd2..1a46b2185d4 100644 --- a/src/compiler/glsl/ir_array_refcount.cpp +++ b/src/compiler/glsl/ir_array_refcount.cpp @@ -34,7 +34,7 @@ #include "util/hash_table.h" ir_array_refcount_visitor::ir_array_refcount_visitor() - : derefs(0), num_derefs(0), derefs_size(0) + : last_array_deref(0), derefs(0), num_derefs(0), derefs_size(0) { this->mem_ctx = ralloc_context(NULL); this->ht = _mesa_hash_table_create(NULL, _mesa_hash_pointer, @@ -159,6 +159,77 @@ ir_array_refcount_visitor::get_array_deref() return d; } +ir_visitor_status +ir_array_refcount_visitor::visit_enter(ir_dereference_array *ir) +{ + /* It could also be a vector or a matrix. Individual elements of vectors + * are natrices are not tracked, so bail. + */ + if (!ir->array->type->is_array()) + return visit_continue; + + /* If this array dereference is a child of an array dereference that was + * already visited, just continue on. Otherwise, for an arrays-of-arrays + * dereference like x[1][2][3][4], we'd process the [1][2][3][4] sequence, + * the [1][2][3] sequence, the [1][2] sequence, and the [1] sequence. This + * ensures that we only process the full sequence. + */ + if (last_array_deref && last_array_deref->array == ir) { + last_array_deref = ir; + return visit_continue; + } + + last_array_deref = ir; + + num_derefs = 0; + + ir_rvalue *rv = ir; + while (rv->ir_type == ir_type_dereference_array) { + ir_dereference_array *const deref = rv->as_dereference_array(); + + assert(deref != NULL); + assert(deref->array->type->is_array()); + + ir_rvalue *const array = deref->array; + const ir_constant *const idx = deref->array_index->as_constant(); + array_deref_range *const dr = get_array_deref(); + + dr->size = array->type->array_size(); + + if (idx != NULL) { + dr->index = idx->get_int_component(0); + } else { + /* An unsized array can occur at the end of an SSBO. We can't track + * accesses to such an array, so bail. + */ + if (array->type->array_size() == 0) + return visit_continue; + + dr->index = dr->size; + } + + rv = array; + } + + ir_dereference_variable *const var_deref = rv->as_dereference_variable(); + + /* If the array being dereferenced is not a variable, bail. At the very + * least, ir_constant and ir_dereference_record are possible. + */ + if (var_deref == NULL) + return visit_continue; + + ir_array_refcount_entry *const entry = + this->get_variable_entry(var_deref->var); + + if (entry == NULL) + return visit_stop; + + entry->mark_array_elements_referenced(derefs, num_derefs); + + return visit_continue; +} + ir_visitor_status ir_array_refcount_visitor::visit(ir_dereference_variable *ir) diff --git a/src/compiler/glsl/ir_array_refcount.h b/src/compiler/glsl/ir_array_refcount.h index 2988046aaed..46ba36cbaa0 100644 --- a/src/compiler/glsl/ir_array_refcount.h +++ b/src/compiler/glsl/ir_array_refcount.h @@ -140,6 +140,7 @@ public: virtual ir_visitor_status visit(ir_dereference_variable *); virtual ir_visitor_status visit_enter(ir_function_signature *); + virtual ir_visitor_status visit_enter(ir_dereference_array *); /** * Find variable in the hash table, and insert it if not present @@ -158,6 +159,15 @@ private: array_deref_range *get_array_deref(); /** + * Last ir_dereference_array that was visited + * + * Used to prevent some redundant calculations. + * + * \sa ::visit_enter(ir_dereference_array *) + */ + ir_dereference_array *last_array_deref; + + /** * \name array_deref_range tracking */ /*@{*/ diff --git a/src/compiler/glsl/tests/array_refcount_test.cpp b/src/compiler/glsl/tests/array_refcount_test.cpp index 29bb133e231..ecd7f46900b 100644 --- a/src/compiler/glsl/tests/array_refcount_test.cpp +++ b/src/compiler/glsl/tests/array_refcount_test.cpp @@ -23,12 +23,18 @@ #include <gtest/gtest.h> #include "ir.h" #include "ir_array_refcount.h" +#include "ir_builder.h" +#include "util/hash_table.h" + +using namespace ir_builder; class array_refcount_test : public ::testing::Test { public: virtual void SetUp(); virtual void TearDown(); + exec_list instructions; + ir_factory *body; void *mem_ctx; /** @@ -40,6 +46,14 @@ public: const glsl_type *array_3_of_array_4_of_array_5_of_vec4; /** + * glsl_type for a int[3]. + * + * The exceptionally verbose name is picked because it matches the syntax + * of http://cdecl.org/. + */ + const glsl_type *array_3_of_int; + + /** * Wrapper to access private member "bits" of ir_array_refcount_entry * * The test class is a friend to ir_array_refcount_entry, but the @@ -81,6 +95,9 @@ array_refcount_test::SetUp() { mem_ctx = ralloc_context(NULL); + instructions.make_empty(); + body = new ir_factory(&instructions, mem_ctx); + /* The type of vec4 x[3][4][5]; */ const glsl_type *const array_5_of_vec4 = glsl_type::get_array_instance(glsl_type::vec4_type, 5); @@ -88,15 +105,105 @@ array_refcount_test::SetUp() glsl_type::get_array_instance(array_5_of_vec4, 4); array_3_of_array_4_of_array_5_of_vec4 = glsl_type::get_array_instance(array_4_of_array_5_of_vec4, 3); + + array_3_of_int = glsl_type::get_array_instance(glsl_type::int_type, 3); } void array_refcount_test::TearDown() { + delete body; + body = NULL; + ralloc_free(mem_ctx); mem_ctx = NULL; } +static operand +deref_array(operand array, operand index) +{ + void *mem_ctx = ralloc_parent(array.val); + + ir_rvalue *val = new(mem_ctx) ir_dereference_array(array.val, index.val); + + return operand(val); +} + +static operand +deref_struct(operand s, const char *field) +{ + void *mem_ctx = ralloc_parent(s.val); + + ir_rvalue *val = new(mem_ctx) ir_dereference_record(s.val, field); + + return operand(val); +} + +/** + * Verify that only the specified set of ir_variables exists in the hash table + */ +static void +validate_variables_in_hash_table(struct hash_table *ht, + unsigned count, + ...) +{ + ir_variable **vars = new ir_variable *[count]; + va_list args; + + /* Make a copy of the list of expected ir_variables. The copied list can + * be modified during the checking. + */ + va_start(args, count); + + for (unsigned i = 0; i < count; i++) + vars[i] = va_arg(args, ir_variable *); + + va_end(args); + + struct hash_entry *entry; + hash_table_foreach(ht, entry) { + const ir_instruction *const ir = (ir_instruction *) entry->key; + const ir_variable *const v = ir->as_variable(); + + if (v == NULL) { + ADD_FAILURE() << "Invalid junk in hash table: ir_type = " + << ir->ir_type << ", address = " + << (void *) ir; + continue; + } + + unsigned i; + for (i = 0; i < count; i++) { + if (vars[i] == NULL) + continue; + + if (vars[i] == v) + break; + } + + if (i == count) { + ADD_FAILURE() << "Invalid variable in hash table: \"" + << v->name << "\""; + } else { + /* As each variable is encountered, remove it from the set. Don't + * bother compacting the set because we don't care about + * performance here. + */ + vars[i] = NULL; + } + } + + /* Check that there's nothing left in the set. */ + for (unsigned i = 0; i < count; i++) { + if (vars[i] != NULL) { + ADD_FAILURE() << "Variable was not in the hash table: \"" + << vars[i]->name << "\""; + } + } + + delete [] vars; +} + TEST_F(array_refcount_test, ir_array_refcount_entry_initial_state_for_scalar) { ir_variable *const var = @@ -290,3 +397,321 @@ TEST_F(array_refcount_test, mark_array_elements_referenced_whole_first_and_third } } } + +TEST_F(array_refcount_test, do_not_process_vector_indexing) +{ + /* Vectors and matrices can also be indexed in much the same manner as + * arrays. The visitor should not try to track per-element accesses to + * these types. + */ + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::float_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(glsl_type::int_type, + "b", + ir_var_auto); + ir_variable *var_c = new(mem_ctx) ir_variable(glsl_type::vec4_type, + "c", + ir_var_auto); + + body->emit(assign(var_a, deref_array(var_c, var_b))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *entry_a = v.get_variable_entry(var_a); + ir_array_refcount_entry *entry_b = v.get_variable_entry(var_b); + ir_array_refcount_entry *entry_c = v.get_variable_entry(var_c); + + EXPECT_TRUE(entry_a->is_referenced); + EXPECT_TRUE(entry_b->is_referenced); + EXPECT_TRUE(entry_c->is_referenced); + + /* As validated by previous tests, for non-array types, num_bits is 1. */ + ASSERT_EQ(1, get_num_bits(*entry_c)); + EXPECT_FALSE(entry_c->is_linearized_index_referenced(0)); +} + +TEST_F(array_refcount_test, do_not_process_matrix_indexing) +{ + /* Vectors and matrices can also be indexed in much the same manner as + * arrays. The visitor should not try to track per-element accesses to + * these types. + */ + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::vec4_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(glsl_type::int_type, + "b", + ir_var_auto); + ir_variable *var_c = new(mem_ctx) ir_variable(glsl_type::mat4_type, + "c", + ir_var_auto); + + body->emit(assign(var_a, deref_array(var_c, var_b))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *entry_a = v.get_variable_entry(var_a); + ir_array_refcount_entry *entry_b = v.get_variable_entry(var_b); + ir_array_refcount_entry *entry_c = v.get_variable_entry(var_c); + + EXPECT_TRUE(entry_a->is_referenced); + EXPECT_TRUE(entry_b->is_referenced); + EXPECT_TRUE(entry_c->is_referenced); + + /* As validated by previous tests, for non-array types, num_bits is 1. */ + ASSERT_EQ(1, get_num_bits(*entry_c)); + EXPECT_FALSE(entry_c->is_linearized_index_referenced(0)); +} + +TEST_F(array_refcount_test, do_not_process_array_inside_structure) +{ + /* Structures can contain arrays. The visitor should not try to track + * per-element accesses to arrays contained inside structures. + */ + const glsl_struct_field fields[] = { + glsl_struct_field(array_3_of_int, "i"), + }; + + const glsl_type *const record_of_array_3_of_int = + glsl_type::get_record_instance(fields, ARRAY_SIZE(fields), "S"); + + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::int_type, + "a", + ir_var_auto); + + ir_variable *var_b = new(mem_ctx) ir_variable(record_of_array_3_of_int, + "b", + ir_var_auto); + + /* a = b.i[2] */ + body->emit(assign(var_a, + deref_array( + deref_struct(var_b, "i"), + body->constant(int(2))))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *entry_a = v.get_variable_entry(var_a); + ir_array_refcount_entry *entry_b = v.get_variable_entry(var_b); + + EXPECT_TRUE(entry_a->is_referenced); + EXPECT_TRUE(entry_b->is_referenced); + + ASSERT_EQ(1, get_num_bits(*entry_b)); + EXPECT_FALSE(entry_b->is_linearized_index_referenced(0)); + + validate_variables_in_hash_table(v.ht, 2, var_a, var_b); +} + +TEST_F(array_refcount_test, visit_simple_indexing) +{ + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::vec4_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4, + "b", + ir_var_auto); + + /* a = b[2][1][0] */ + body->emit(assign(var_a, + deref_array( + deref_array( + deref_array(var_b, body->constant(int(2))), + body->constant(int(1))), + body->constant(int(0))))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + const unsigned accessed_element = 0 + (1 * 5) + (2 * 4 * 5); + ir_array_refcount_entry *entry_b = v.get_variable_entry(var_b); + const unsigned total_elements = var_b->type->arrays_of_arrays_size(); + + for (unsigned i = 0; i < total_elements; i++) + EXPECT_EQ(i == accessed_element, entry_b->is_linearized_index_referenced(i)) << + "i = " << i; + + validate_variables_in_hash_table(v.ht, 2, var_a, var_b); +} + +TEST_F(array_refcount_test, visit_whole_second_array_indexing) +{ + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::vec4_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4, + "b", + ir_var_auto); + ir_variable *var_i = new(mem_ctx) ir_variable(glsl_type::int_type, + "i", + ir_var_auto); + + /* a = b[2][i][1] */ + body->emit(assign(var_a, + deref_array( + deref_array( + deref_array(var_b, body->constant(int(2))), + var_i), + body->constant(int(1))))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *const entry_b = v.get_variable_entry(var_b); + for (unsigned i = 0; i < 3; i++) { + for (unsigned j = 0; j < 4; j++) { + for (unsigned k = 0; k < 5; k++) { + const bool accessed = (i == 2) && (k == 1); + const unsigned linearized_index = k + (j * 5) + (i * 4 * 5); + + EXPECT_EQ(accessed, + entry_b->is_linearized_index_referenced(linearized_index)) << + "i = " << i; + } + } + } + + validate_variables_in_hash_table(v.ht, 3, var_a, var_b, var_i); +} + +TEST_F(array_refcount_test, visit_array_indexing_an_array) +{ + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::vec4_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4, + "b", + ir_var_auto); + ir_variable *var_c = new(mem_ctx) ir_variable(array_3_of_int, + "c", + ir_var_auto); + ir_variable *var_i = new(mem_ctx) ir_variable(glsl_type::int_type, + "i", + ir_var_auto); + + /* a = b[2][3][c[i]] */ + body->emit(assign(var_a, + deref_array( + deref_array( + deref_array(var_b, body->constant(int(2))), + body->constant(int(3))), + deref_array(var_c, var_i)))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *const entry_b = v.get_variable_entry(var_b); + + for (unsigned i = 0; i < 3; i++) { + for (unsigned j = 0; j < 4; j++) { + for (unsigned k = 0; k < 5; k++) { + const bool accessed = (i == 2) && (j == 3); + const unsigned linearized_index = k + (j * 5) + (i * 4 * 5); + + EXPECT_EQ(accessed, + entry_b->is_linearized_index_referenced(linearized_index)) << + "array b[" << i << "][" << j << "][" << k << "], " << + "linear index = " << linearized_index; + } + } + } + + ir_array_refcount_entry *const entry_c = v.get_variable_entry(var_c); + + for (unsigned i = 0; i < var_c->type->array_size(); i++) { + EXPECT_EQ(true, entry_c->is_linearized_index_referenced(i)) << + "array c, i = " << i; + } + + validate_variables_in_hash_table(v.ht, 4, var_a, var_b, var_c, var_i); +} + +TEST_F(array_refcount_test, visit_array_indexing_with_itself) +{ + const glsl_type *const array_2_of_array_3_of_int = + glsl_type::get_array_instance(array_3_of_int, 2); + + const glsl_type *const array_2_of_array_2_of_array_3_of_int = + glsl_type::get_array_instance(array_2_of_array_3_of_int, 2); + + ir_variable *var_a = new(mem_ctx) ir_variable(glsl_type::int_type, + "a", + ir_var_auto); + ir_variable *var_b = new(mem_ctx) ir_variable(array_2_of_array_2_of_array_3_of_int, + "b", + ir_var_auto); + + /* Given GLSL code: + * + * int b[2][2][3]; + * a = b[ b[0][0][0] ][ b[ b[0][1][0] ][ b[1][0][0] ][1] ][2] + * + * b[0][0][0], b[0][1][0], and b[1][0][0] are trivially accessed. + * + * b[*][*][1] and b[*][*][2] are accessed. + * + * Only b[1][1][0] is not accessed. + */ + operand b000 = deref_array( + deref_array( + deref_array(var_b, body->constant(int(0))), + body->constant(int(0))), + body->constant(int(0))); + + operand b010 = deref_array( + deref_array( + deref_array(var_b, body->constant(int(0))), + body->constant(int(1))), + body->constant(int(0))); + + operand b100 = deref_array( + deref_array( + deref_array(var_b, body->constant(int(1))), + body->constant(int(0))), + body->constant(int(0))); + + operand b_b010_b100_1 = deref_array( + deref_array( + deref_array(var_b, b010), + b100), + body->constant(int(1))); + + body->emit(assign(var_a, + deref_array( + deref_array( + deref_array(var_b, b000), + b_b010_b100_1), + body->constant(int(2))))); + + ir_array_refcount_visitor v; + + visit_list_elements(&v, &instructions); + + ir_array_refcount_entry *const entry_b = v.get_variable_entry(var_b); + + for (unsigned i = 0; i < 2; i++) { + for (unsigned j = 0; j < 2; j++) { + for (unsigned k = 0; k < 3; k++) { + const bool accessed = !(i == 1 && j == 1 && k == 0); + const unsigned linearized_index = k + (j * 3) + (i * 2 * 3); + + EXPECT_EQ(accessed, + entry_b->is_linearized_index_referenced(linearized_index)) << + "array b[" << i << "][" << j << "][" << k << "], " << + "linear index = " << linearized_index; + } + } + } + + validate_variables_in_hash_table(v.ht, 2, var_a, var_b); +} |