diff options
Diffstat (limited to 'src/mesa/tnl/t_vertex_codegen.c')
-rw-r--r-- | src/mesa/tnl/t_vertex_codegen.c | 509 |
1 files changed, 509 insertions, 0 deletions
diff --git a/src/mesa/tnl/t_vertex_codegen.c b/src/mesa/tnl/t_vertex_codegen.c new file mode 100644 index 00000000000..3c99b0411ea --- /dev/null +++ b/src/mesa/tnl/t_vertex_codegen.c @@ -0,0 +1,509 @@ +/* + * Copyright 2003 Tungsten Graphics, inc. + * All Rights Reserved. + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * on the rights to use, copy, modify, merge, publish, distribute, sub + * license, and/or sell copies of the Software, and to permit persons to whom + * the Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice (including the next + * paragraph) shall be included in all copies or substantial portions of the + * Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL + * TUNGSTEN GRAPHICS AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, + * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR + * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE + * USE OR OTHER DEALINGS IN THE SOFTWARE. + * + * Authors: + * Keith Whitwell <[email protected]> + */ + +#include "glheader.h" +#include "context.h" +#include "colormac.h" + +#include "t_context.h" +#include "t_vertex.h" + +#include "simple_list.h" + +/* Another codegen scheme, hopefully portable to a few different + * architectures without too much work. + */ + + + + +static GLboolean emit_4f_viewport_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)) && + p->emit_mad(p, out(2), vp(10), in(2), vp(14)) && + p->emit_mov(p, out(3), in(3)); +} + +static GLboolean emit_4f_viewport_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)) && + p->emit_mad(p, out(2), vp(10), in(2), vp(14)) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_4f_viewport_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)) && + p->emit_mov(p, out(2), vp(14)) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_4f_viewport_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mov(p, out(1), vp(13)) && + p->emit_mov(p, out(2), vp(14)) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_3f_viewport_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)) && + p->emit_mad(p, out(2), vp(10), in(2), vp(14)); +} + +static GLboolean emit_3f_viewport_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)) && + p->emit_mov(p, out(2), vp(14)); +} + +static GLboolean emit_3f_viewport_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mov(p, out(1), vp(13)) && + p->emit_mov(p, out(2), vp(14)); +} + +static GLboolean emit_2f_viewport_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)) && + p->emit_mad(p, out(1), vp(5), in(1), vp(13)); +} + +static GLboolean emit_2f_viewport_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mad(p, out(0), vp(0), in(0), vp(12)); +} + + +static GLboolean emit_4f_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_mov(p, out(2), in(2)) && + p->emit_mov(p, out(3), in(3)); +} + +static GLboolean emit_4f_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_mov(p, out(2), in(2)) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_4f_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_const(p, out(2), 0.0) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_4f_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_const(p, out(1), 0.0) && + p->emit_const(p, out(2), 0.0) && + p->emit_const(p, out(3), 1.0); +} + +static GLboolean emit_3f_xyw_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_mov(p, out(2), in(3)); +} + +static GLboolean emit_3f_xyw_err( struct tnl_clipspace_codegen *p ) +{ + assert(0); + return GL_FALSE; +} + +static GLboolean emit_3f_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_mov(p, out(2), in(2)); +} + +static GLboolean emit_3f_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)) && + p->emit_const(p, out(2), 0.0); +} + +static GLboolean emit_3f_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_const(p, out(1), 0.0) && + p->emit_const(p, out(2), 0.0); +} + + +static GLboolean emit_2f_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_mov(p, out(1), in(1)); +} + +static GLboolean emit_2f_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)) && + p->emit_const(p, out(1), 0.0); +} + +static GLboolean emit_1f_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_mov(p, out(0), in(0)); +} + +static GLboolean emit_4chan_4f_rgba_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_chan(p, out(0), in(0)) && + p->emit_float_to_chan(p, out(1), in(1)) && + p->emit_float_to_chan(p, out(2), in(2)) && + p->emit_float_to_chan(p, out(3), in(3)); +} + +static GLboolean emit_4chan_4f_rgba_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_chan(p, out(0), in(0)) && + p->emit_float_to_chan(p, out(1), in(1)) && + p->emit_float_to_chan(p, out(2), in(2)) && + p->emit_const_chan(p, out(3), CHAN_MAX); +} + +static GLboolean emit_4chan_4f_rgba_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_chan(p, out(0), in(0)) && + p->emit_float_to_chan(p, out(1), in(1)) && + p->emit_const_chan(p, out(2), 0) && + p->emit_const_chan(p, out(3), CHAN_MAX); +} + +static GLboolean emit_4chan_4f_rgba_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_chan(p, out(0), in(0)) && + p->emit_const_chan(p, out(1), 0) && + p->emit_const_chan(p, out(2), 0) && + p->emit_const_chan(p, out(3), CHAN_MAX); +} + +static GLboolean emit_4ub_4f_rgba_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(2), in(2)) && + p->emit_float_to_ubyte(p, out(3), in(3)); +} + +static GLboolean emit_4ub_4f_rgba_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(2), in(2)) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_4ub_4f_rgba_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_const_ubyte(p, out(2), 0) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_4ub_4f_rgba_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_const_ubyte(p, out(1), 0) && + p->emit_const_ubyte(p, out(2), 0) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_4ub_4f_bgra_4( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(0), in(2)) && + p->emit_float_to_ubyte(p, out(3), in(3)); +} + +static GLboolean emit_4ub_4f_bgra_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(0), in(2)) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_4ub_4f_bgra_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_const_ubyte(p, out(0), 0) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_4ub_4f_bgra_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_const_ubyte(p, out(1), 0) && + p->emit_const_ubyte(p, out(0), 0) && + p->emit_const_ubyte(p, out(3), 0xff); +} + +static GLboolean emit_3ub_3f_rgb_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(2), in(2)); +} + +static GLboolean emit_3ub_3f_rgb_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_const_ubyte(p, out(2), 0); +} + +static GLboolean emit_3ub_3f_rgb_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)) && + p->emit_const_ubyte(p, out(1), 0) && + p->emit_const_ubyte(p, out(2), 0); +} + +static GLboolean emit_3ub_3f_bgr_3( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_float_to_ubyte(p, out(0), in(2)); +} + +static GLboolean emit_3ub_3f_bgr_2( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_float_to_ubyte(p, out(1), in(1)) && + p->emit_const_ubyte(p, out(0), 0); +} + +static GLboolean emit_3ub_3f_bgr_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(2), in(0)) && + p->emit_const_ubyte(p, out(1), 0) && + p->emit_const_ubyte(p, out(0), 0); +} + + +static GLboolean emit_1ub_1f_1( struct tnl_clipspace_codegen *p ) +{ + return + p->emit_float_to_ubyte(p, out(0), in(0)); +} + + + + +static struct { + const char *name; + GLenum out_type; + GLboolean need_vp; + GLboolean (*emit[4])( struct tnl_clipspace_codegen * ); +} emit_info[EMIT_MAX] = { + + { "1f", GL_FLOAT, GL_FALSE, + { emit_1f_1, emit_1f_1, emit_1f_1, emit_1f_1 } }, + + { "2f", GL_FLOAT, GL_FALSE, + { emit_2f_1, emit_2f_2, emit_2f_2, emit_2f_2 } }, + + { "3f", GL_FLOAT, GL_FALSE, + { emit_3f_1, emit_3f_2, emit_3f_3, emit_3f_3 } }, + + { "4f", GL_FLOAT, GL_FALSE, + { emit_4f_1, emit_4f_2, emit_4f_3, emit_4f_4 } }, + + { "2f_viewport", GL_FLOAT, GL_TRUE, + { emit_2f_viewport_1, emit_2f_viewport_2, emit_2f_viewport_2, + emit_2f_viewport_2 } }, + + { "3f_viewport", GL_FLOAT, GL_TRUE, + { emit_3f_viewport_1, emit_3f_viewport_2, emit_3f_viewport_3, + emit_3f_viewport_3 } }, + + { "4f_viewport", GL_FLOAT, GL_TRUE, + { emit_4f_viewport_1, emit_4f_viewport_2, emit_4f_viewport_3, + emit_4f_viewport_4 } }, + + { "3f_xyw", GL_FLOAT, GL_FALSE, + { emit_3f_xyw_err, emit_3f_xyw_err, emit_3f_xyw_err, + emit_3f_xyw_4 } }, + + { "1ub_1f", GL_UNSIGNED_BYTE, GL_FALSE, + { emit_1ub_1f_1, emit_1ub_1f_1, emit_1ub_1f_1, emit_1ub_1f_1 } }, + + { "3ub_3f_rgb", GL_UNSIGNED_BYTE, GL_FALSE, + { emit_3ub_3f_rgb_1, emit_3ub_3f_rgb_2, emit_3ub_3f_rgb_3, + emit_3ub_3f_rgb_3 } }, + + { "3ub_3f_bgr", GL_UNSIGNED_BYTE, GL_FALSE, + { emit_3ub_3f_bgr_1, emit_3ub_3f_bgr_2, emit_3ub_3f_bgr_3, + emit_3ub_3f_bgr_3 } }, + + { "4ub_4f_rgba", GL_UNSIGNED_BYTE, GL_FALSE, + { emit_4ub_4f_rgba_1, emit_4ub_4f_rgba_2, emit_4ub_4f_rgba_3, + emit_4ub_4f_rgba_4 } }, + + { "4ub_4f_bgra", GL_UNSIGNED_BYTE, GL_FALSE, + { emit_4ub_4f_bgra_1, emit_4ub_4f_bgra_2, emit_4ub_4f_bgra_3, + emit_4ub_4f_bgra_4 } }, + + { "4chan_4f_rgba", CHAN_TYPE, GL_FALSE, + { emit_4chan_4f_rgba_1, emit_4chan_4f_rgba_2, emit_4chan_4f_rgba_3, + emit_4chan_4f_rgba_4 } }, + + { "pad", 0, 0, + { 0, 0, 0, 0 } } + +}; + + +/*********************************************************************** + * list(attrib, size) --> function + * + * Because of the dependence of size, this all has to take place after + * the pipeline has been run. + */ + +emit_func _tnl_codegen_emit( GLcontext *ctx ) +{ + struct vertex_buffer *VB = &TNL_CONTEXT(ctx)->vb; + struct tnl_clipspace *vtx = GET_VERTEX_STATE(ctx); + struct tnl_clipspace_attr *a = vtx->attr; + struct tnl_clipspace_codegen *p = &vtx->codegen; + const GLuint count = vtx->attr_count; + GLuint j; + + /* Need a faster lookup, or is this linear scan of an MRU list good + * enough? MRU chosen based on the guess that consecutive VB's are + * likely to be of the same format. A hash of attributes and sizes + * might be a better technique. + * + * With the vtx code now in place, it should be possible to track + * changes to the sizes of input arrays (and state, of course) and + * only invalidate this function when those sizes have changed. + */ +#if 0 + foreach (l, p->codegen_list) { + if (l->attr_count != count) + continue; + + /* Assumptions: + * a[j].vp will not change for a given attrib + * a[j].vertex_offset will not change nothing else has changed. + */ + for (j = 0; j < count; j++) + if (a[j].attrib != l->a[j].attrib || + a[j].sz != l->a[j].sz) + break; + + if (j == count) { + move_to_head(l, p->codegen_list); + return l->func; + } + } +#endif + + p->emit_header( p, vtx ); + + for (j = 0; j < count; j++) { + GLuint sz = VB->AttribPtr[a[j].attrib]->size - 1; + p->emit_attr_header( p, a, j, + emit_info[a[j].format].out_type, + emit_info[a[j].format].need_vp ); + + if (!emit_info[a[j].format].emit[sz]( p )) { + fprintf(stderr, "codegen failed\n"); + return 0; + } + + p->emit_attr_footer( p ); + } + + p->emit_footer( p ); + + return p->emit_store_func( p ); +} + |