diff options
author | Brian <[email protected]> | 2007-01-27 20:06:41 -0700 |
---|---|---|
committer | Brian <[email protected]> | 2007-01-27 20:06:41 -0700 |
commit | d6772f157a56bb53b754bb16c98e102b54c82a0e (patch) | |
tree | d0d0c1f8b7e134d55453567072c0a7acb44c5f63 /src/mesa/shader/slang/slang_vartable.c | |
parent | ea8b68e0f7e7a4025ce662d36380157273ce10a3 (diff) |
Improved register allocation: allow four 'float' vars or temporaries to share a single register. Clean-up needed.
Diffstat (limited to 'src/mesa/shader/slang/slang_vartable.c')
-rw-r--r-- | src/mesa/shader/slang/slang_vartable.c | 140 |
1 files changed, 100 insertions, 40 deletions
diff --git a/src/mesa/shader/slang/slang_vartable.c b/src/mesa/shader/slang/slang_vartable.c index 6d2b4369d94..cadefda1bca 100644 --- a/src/mesa/shader/slang/slang_vartable.c +++ b/src/mesa/shader/slang/slang_vartable.c @@ -4,6 +4,7 @@ #include "slang_compile_variable.h" #include "slang_vartable.h" #include "slang_ir.h" +#include "prog_instruction.h" static int dbg = 0; @@ -23,7 +24,8 @@ struct slang_var_table_ int num_entries; slang_variable **vars; /* array [num_entries] */ - TempState temps[MAX_PROGRAM_TEMPS]; + TempState temps[MAX_PROGRAM_TEMPS * 4]; + int size[MAX_PROGRAM_TEMPS]; struct slang_var_table_ *parent; }; @@ -46,6 +48,7 @@ _slang_push_var_table(slang_var_table *parent) if (parent) { /* copy the info indicating which temp regs are in use */ memcpy(t->temps, parent->temps, sizeof(t->temps)); + memcpy(t->size, parent->size, sizeof(t->size)); } if (dbg) printf("Pushing level %d\n", t->level); } @@ -67,12 +70,22 @@ _slang_pop_var_table(slang_var_table *t) /* free the storage allocated for each variable */ for (i = 0; i < t->num_entries; i++) { slang_ir_storage *store = (slang_ir_storage *) t->vars[i]->aux; - GLint j, sz4 = (store->Size + 3) / 4; - if (dbg) printf(" Free var %s, size %d\n", - (char*) t->vars[i]->a_name, store->Size); - for (j = 0; j < sz4; j++) { - assert(t->temps[store->Index + j] == VAR); - t->temps[store->Index + j] = FREE; + GLint j; + const GLuint sz = store->Size; + GLuint comp; + if (dbg) printf(" Free var %s, size %d at %d\n", + (char*) t->vars[i]->a_name, store->Size, + store->Index); + + if (sz == 1) + comp = GET_SWZ(store->Swizzle, 0); + else + comp = 0; + + assert(store->Index >= 0); + for (j = 0; j < sz; j++) { + assert(t->temps[store->Index * 4 + j + comp] == VAR); + t->temps[store->Index * 4 + j + comp] = FREE; } store->Index = -1; } @@ -80,9 +93,9 @@ _slang_pop_var_table(slang_var_table *t) /* just verify that any remaining allocations in this scope * were for temps */ - for (i = 0; i < MAX_PROGRAM_TEMPS; i++) { + for (i = 0; i < MAX_PROGRAM_TEMPS * 4; i++) { if (t->temps[i] && !t->parent->temps[i]) { - if (dbg) printf(" Free reg %d\n", i); + if (dbg) printf(" Free reg %d\n", i/4); assert(t->temps[i] == TEMP); } } @@ -131,16 +144,22 @@ _slang_find_variable(const slang_var_table *t, slang_atom name) } +/** + * Allocation helper. + * \param size var size in floats + * \return position for var, measured in floats + */ static GLint alloc_reg(slang_var_table *t, GLint size, GLboolean isTemp) { - const GLuint sz4 = (size + 3) / 4; + /* if size == 1, allocate anywhere, else, pos must be multiple of 4 */ + const GLuint step = (size == 1) ? 1 : 4; GLuint i, j; assert(size > 0); /* number of floats */ - for (i = 0; i < MAX_PROGRAM_TEMPS; i++) { + for (i = 0; i < MAX_PROGRAM_TEMPS - size; i += step) { GLuint found = 0; - for (j = 0; j < sz4; j++) { + for (j = 0; j < size; j++) { if (i + j < MAX_PROGRAM_TEMPS && !t->temps[i + j]) { found++; } @@ -148,10 +167,14 @@ alloc_reg(slang_var_table *t, GLint size, GLboolean isTemp) break; } } - if (found == sz4) { - /* found block of size/4 free regs */ - for (j = 0; j < sz4; j++) + if (found == size) { + /* found block of size free regs */ + if (size > 1) + assert(i % 4 == 0); + for (j = 0; j < size; j++) t->temps[i + j] = isTemp ? TEMP : VAR; + printf("t->size[%d] = %d\n", i, size); + t->size[i] = size; return i; } } @@ -161,61 +184,98 @@ alloc_reg(slang_var_table *t, GLint size, GLboolean isTemp) /** * Allocate temp register(s) for storing a variable. + * \param size size needed, in floats + * \param swizzle returns swizzle mask for accessing var in register + * \return register allocated, or -1 */ GLint -_slang_alloc_var(slang_var_table *t, GLint size) +_slang_alloc_var(slang_var_table *t, GLint size, GLuint *swizzle) { int i = alloc_reg(t, size, GL_FALSE); - if (dbg) printf("Alloc var %d (level %d)\n", i, t->level); - return i; -} - - -void -_slang_reserve_var(slang_var_table *t, GLint r, GLint size) -{ - const GLint sz4 = (size + 3) / 4; - GLint i; - for (i = 0; i < sz4; i++) { - t->temps[r + i] = VAR; + if (i < 0) + return -1; + + if (size == 1) { + GLuint comp = i % 4; + *swizzle = MAKE_SWIZZLE4(comp, comp, comp, comp); + char swz = "xyzw"[comp]; + if (dbg) printf("Alloc var sz %d at %d.%c (level %d)\n", size, i/4, swz, t->level); } + else { + *swizzle = SWIZZLE_NOOP; + if (dbg) printf("Alloc var sz %d at %d.xyzw (level %d)\n", size, i/4, t->level); + } + return i / 4; } + /** * Allocate temp register(s) for storing an unnamed intermediate value. */ GLint -_slang_alloc_temp(slang_var_table *t, GLint size) +_slang_alloc_temp(slang_var_table *t, GLint size, GLuint *swizzle) { int i = alloc_reg(t, size, GL_TRUE); - if (dbg) printf("Alloc temp %d (level %d)\n", i, t->level); - return i; + if (i < 0) + return -1; + + if (size == 1) { + GLuint comp = i % 4; + assert(comp < 4); + int swz = "xyzw"[comp]; + *swizzle = MAKE_SWIZZLE4(comp, comp, comp, comp); + if (dbg) printf("Alloc temp sz %d at %d.%c (level %d)\n", + size, i/4, swz, t->level); + } + else { + *swizzle = SWIZZLE_NOOP; + if (dbg) printf("Alloc temp sz %d at %d.xyzw (level %d)\n", + size, i/4, t->level); + } + return i / 4; } void -_slang_free_temp(slang_var_table *t, GLint r, GLint size) +_slang_free_temp(slang_var_table *t, GLint r, GLint size, GLuint swizzle) { - const GLuint sz4 = (size + 3) / 4; GLuint i; assert(size > 0); assert(r >= 0); - assert(r < MAX_PROGRAM_TEMPS); - if (dbg) printf("Free temp %d (level %d)\n", r, t->level); - for (i = 0; i < sz4; i++) { - assert(t->temps[r + i] == TEMP); - t->temps[r + i] = FREE; + assert(r + size <= MAX_PROGRAM_TEMPS); + if (dbg) printf("Free temp sz %d at %d (level %d)\n", size, r, t->level); + if (size == 1) { + GLuint comp = GET_SWZ(swizzle, 0); + assert(swizzle == MAKE_SWIZZLE4(comp, comp, comp, comp)); + assert(comp < 4); + assert(t->size[r * 4 + comp] == 1); + assert(t->temps[r * 4 + comp] == TEMP); + t->temps[r * 4 + comp] = FREE; + } + else { + assert(swizzle == SWIZZLE_NOOP); + assert(t->size[r*4] == size); + for (i = 0; i < size; i++) { + assert(t->temps[r * 4 + i] == TEMP); + t->temps[r * 4 + i] = FREE; + } } } GLboolean -_slang_is_temp(slang_var_table *t, GLint r) +_slang_is_temp(slang_var_table *t, GLint r, GLuint swizzle) { assert(r >= 0); assert(r < MAX_PROGRAM_TEMPS); - if (t->temps[r] == TEMP) + GLuint comp; + if (swizzle == SWIZZLE_NOOP) + comp = 0; + else + comp = GET_SWZ(swizzle, 0); + + if (t->temps[r * 4 + comp] == TEMP) return GL_TRUE; else return GL_FALSE; |