/*
 * Copyright 2000-2001 VA Linux Systems, Inc.
 * (C) Copyright IBM Corporation 2004
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * VA LINUX SYSTEM, IBM AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

/**
 * \file spantmp2.h
 *
 * Template file of span read / write functions.
 *
 * The pixel layout is chosen at preprocessing time from SPANTMP_PIXEL_FMT
 * and SPANTMP_PIXEL_TYPE; an unsupported pair stops compilation with
 * \c #error.  For the selected layout the file defines WRITE_RGBA,
 * WRITE_PIXEL and READ_RGBA and then emits static functions whose names are
 * built with TAG() / TAG2().
 *
 * The following names are used but not defined here and must be supplied
 * by the including file or by spantmp_common.h (neither is visible from
 * this file): TAG, TAG2, LOCAL_VARS, Y_FLIP, CLIPSPAN, HW_CLIPLOOP,
 * HW_ENDCLIPLOOP, HW_WRITE_LOCK / HW_WRITE_UNLOCK, HW_READ_LOCK /
 * HW_READ_UNLOCK, and -- unless GET_PTR or GET_VALUE / PUT_VALUE are
 * overridden -- \c buf and \c pitch.
 *
 * WRITE_PIXEL, WRITE_RGBA, READ_RGBA, TAG, TAG2, GET_VALUE, PUT_VALUE,
 * GET_PTR, SPANTMP_PIXEL_FMT and SPANTMP_PIXEL_TYPE are all \c #undef'd at
 * the end of the file.
 *
 * \author Keith Whitwell
 * \author Gareth Hughes
 * \author Ian Romanick
 */

#include "main/colormac.h"
#include "spantmp_common.h"

#ifndef DBG
#define DBG 0
#endif

/* Separate read / write clip loops default to the common HW_CLIPLOOP(). */
#ifndef HW_READ_CLIPLOOP
#define HW_READ_CLIPLOOP() HW_CLIPLOOP()
#endif

#ifndef HW_WRITE_CLIPLOOP
#define HW_WRITE_CLIPLOOP() HW_CLIPLOOP()
#endif

#if (SPANTMP_PIXEL_FMT == GL_RGB) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_5_6_5)

/**
 ** GL_RGB, GL_UNSIGNED_SHORT_5_6_5
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

/* Pack 8-bit r/g/b into 5:6:5 (red in the top bits); alpha is ignored. */
#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, ((((int)(r) & 0xf8) << 8) | \
                      (((int)(g) & 0xfc) << 3) | \
                      (((int)(b) & 0xf8) >> 3)))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* Each field is rescaled so that its maximum value maps to 255; alpha is
 * reported as 0xff.
 */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      rgba[0] = ((p >> 8) & 0xf8) * 255 / 0xf8; \
      rgba[1] = ((p >> 3) & 0xfc) * 255 / 0xfc; \
      rgba[2] = ((p << 3) & 0xf8) * 255 / 0xf8; \
      rgba[3] = 0xff; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_RGB) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_5_6_5_REV)

/**
 ** GL_RGB, GL_UNSIGNED_SHORT_5_6_5_REV
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, PACK_COLOR_565_REV( r, g, b ))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* Same as the 5_6_5 reader after swapping the two bytes of the pixel. */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      p = p << 8 | p >> 8; \
      rgba[0] = ((p >> 8) & 0xf8) * 255 / 0xf8; \
      rgba[1] = ((p >> 3) & 0xfc) * 255 / 0xfc; \
      rgba[2] = ((p << 3) & 0xf8) * 255 / 0xf8; \
      rgba[3] = 0xff; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_4_4_4_4)

/**
 ** GL_BGRA, GL_UNSIGNED_SHORT_4_4_4_4
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, PACK_COLOR_4444_REV(a, r, g, b))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* Each 4-bit field is widened to 8 bits by multiplying by 0x11. */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      rgba[0] = ((p >> 0) & 0xf) * 0x11; \
      rgba[1] = ((p >> 12) & 0xf) * 0x11; \
      rgba[2] = ((p >> 4) & 0xf) * 0x11; \
      rgba[3] = ((p >> 8) & 0xf) * 0x11; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_4_4_4_4_REV)

/**
 ** GL_BGRA, GL_UNSIGNED_SHORT_4_4_4_4_REV
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, PACK_COLOR_4444(a, r, g, b))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* Each 4-bit field is widened to 8 bits by multiplying by 0x11. */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      rgba[0] = ((p >> 8) & 0xf) * 0x11; \
      rgba[1] = ((p >> 4) & 0xf) * 0x11; \
      rgba[2] = ((p >> 0) & 0xf) * 0x11; \
      rgba[3] = ((p >> 12) & 0xf) * 0x11; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_1_5_5_5_REV)

/**
 ** GL_BGRA, GL_UNSIGNED_SHORT_1_5_5_5_REV
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, PACK_COLOR_1555(a, r, g, b))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* 5-bit colour fields are rescaled to 0..255; the single alpha bit becomes
 * 0x00 or 0xff.
 */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      rgba[0] = ((p >> 7) & 0xf8) * 255 / 0xf8; \
      rgba[1] = ((p >> 2) & 0xf8) * 255 / 0xf8; \
      rgba[2] = ((p << 3) & 0xf8) * 255 / 0xf8; \
      rgba[3] = ((p >> 15) & 0x1) * 0xff; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_1_5_5_5)

/**
 ** GL_BGRA, GL_UNSIGNED_SHORT_1_5_5_5
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) (buf + (_x) * 2 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLushort *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLushort *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

#define WRITE_RGBA( _x, _y, r, g, b, a ) \
   PUT_VALUE(_x, _y, PACK_COLOR_1555_REV(a, r, g, b))

#define WRITE_PIXEL( _x, _y, p ) PUT_VALUE(_x, _y, p)

/* Same as the 1_5_5_5_REV reader after swapping the two bytes of the pixel. */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLushort p = GET_VALUE(_x, _y); \
      p = p << 8 | p >> 8; \
      rgba[0] = ((p >> 7) & 0xf8) * 255 / 0xf8; \
      rgba[1] = ((p >> 2) & 0xf8) * 255 / 0xf8; \
      rgba[2] = ((p << 3) & 0xf8) * 255 / 0xf8; \
      rgba[3] = ((p >> 15) & 0x1) * 0xff; \
   } while (0)

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)

/**
 ** GL_BGRA, GL_UNSIGNED_INT_8_8_8_8_REV
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) ( buf + (_x) * 4 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLuint *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLuint *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

/* The components are converted to GLuint before shifting: shifting an
 * int-promoted byte >= 0x80 left by 24 overflows a 32-bit signed int.
 */
#define WRITE_RGBA(_x, _y, r, g, b, a) \
   PUT_VALUE(_x, _y, (((GLuint)(r) << 16) | \
                      ((GLuint)(g) << 8) | \
                      ((GLuint)(b) << 0) | \
                      ((GLuint)(a) << 24)))

#define WRITE_PIXEL(_x, _y, p) PUT_VALUE(_x, _y, p)

#if defined( USE_X86_ASM )
/* Byte-swap, then rotate right by 8 bits, and store all four bytes of
 * rgba with a single 32-bit write.
 */
#define READ_RGBA(rgba, _x, _y) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      __asm__ __volatile__( "bswap %0; rorl $8, %0" \
                            : "=r" (p) : "0" (p) ); \
      ((GLuint *)rgba)[0] = p; \
   } while (0)
#elif defined( MESA_BIG_ENDIAN )
/* On PowerPC with GCC 3.4.2 the shift madness below becomes a single
 * rotlwi instruction.  It also produces good code on SPARC.
 */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      GLuint t = p; \
      *((uint32_t *) rgba) = (t >> 24) | (p << 8); \
   } while (0)
#else
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      rgba[0] = (p >> 16) & 0xff; \
      rgba[1] = (p >> 8) & 0xff; \
      rgba[2] = (p >> 0) & 0xff; \
      rgba[3] = (p >> 24) & 0xff; \
   } while (0)
#endif

#elif (SPANTMP_PIXEL_FMT == GL_BGRA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8)

/**
 ** GL_BGRA, GL_UNSIGNED_INT_8_8_8_8
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) ( buf + (_x) * 4 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLuint *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLuint *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

/* The components are converted to GLuint before shifting: shifting an
 * int-promoted byte >= 0x80 left by 24 overflows a 32-bit signed int.
 */
#define WRITE_RGBA(_x, _y, r, g, b, a) \
   PUT_VALUE(_x, _y, (((GLuint)(r) << 8) | \
                      ((GLuint)(g) << 16) | \
                      ((GLuint)(b) << 24) | \
                      ((GLuint)(a) << 0)))

#define WRITE_PIXEL(_x, _y, p) PUT_VALUE(_x, _y, p)

#if defined( USE_X86_ASM )
/* Rotate right by 8 bits and store all four bytes of rgba with a single
 * 32-bit write.
 */
#define READ_RGBA(rgba, _x, _y) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      __asm__ __volatile__( "rorl $8, %0" \
                            : "=r" (p) : "0" (p) ); \
      ((GLuint *)rgba)[0] = p; \
   } while (0)
#elif defined( MESA_BIG_ENDIAN )
/* On PowerPC with GCC 3.4.2 the shift madness below becomes a single
 * rotlwi instruction.  It also produces good code on SPARC.
 */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = CPU_TO_LE32(GET_VALUE(_x, _y)); \
      GLuint t = p; \
      *((uint32_t *) rgba) = (t >> 24) | (p << 8); \
   } while (0)
#else
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      rgba[0] = (p >> 8) & 0xff; \
      rgba[1] = (p >> 16) & 0xff; \
      rgba[2] = (p >> 24) & 0xff; \
      rgba[3] = (p >> 0) & 0xff; \
   } while (0)
#endif

#elif (SPANTMP_PIXEL_FMT == GL_BGR) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)

/**
 ** GL_BGR, GL_UNSIGNED_INT_8_8_8_8_REV
 **
 ** This is really for MESA_FORMAT_XRGB8888.  The spantmp code needs to be
 ** kicked to the curb, and we need to just code-gen this.
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) ( buf + (_x) * 4 + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLuint *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLuint *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

/* The incoming alpha is ignored and the top byte is always written as
 * 0xff.  The constant is unsigned because (0xff << 24) overflows a 32-bit
 * signed int.
 */
#define WRITE_RGBA(_x, _y, r, g, b, a) \
   PUT_VALUE(_x, _y, (((GLuint)(r) << 16) | \
                      ((GLuint)(g) << 8) | \
                      ((GLuint)(b) << 0) | \
                      (0xffu << 24)))

#define WRITE_PIXEL(_x, _y, p) PUT_VALUE(_x, _y, p)

#if defined( USE_X86_ASM )
/* Same shuffle as the BGRA 8_8_8_8_REV reader, with the top byte of the
 * stored word forced to 0xff.
 */
#define READ_RGBA(rgba, _x, _y) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      __asm__ __volatile__( "bswap %0; rorl $8, %0" \
                            : "=r" (p) : "0" (p) ); \
      ((GLuint *)rgba)[0] = p | 0xff000000; \
   } while (0)
#elif defined( MESA_BIG_ENDIAN )
/* Shift the pixel left by one byte and force the low byte of the stored
 * word to 0xff.
 */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      *((uint32_t *) rgba) = (p << 8) | 0xff; \
   } while (0)
#else
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLuint p = GET_VALUE(_x, _y); \
      rgba[0] = (p >> 16) & 0xff; \
      rgba[1] = (p >> 8) & 0xff; \
      rgba[2] = (p >> 0) & 0xff; \
      rgba[3] = 0xff; \
   } while (0)
#endif

#elif (SPANTMP_PIXEL_FMT == GL_ALPHA) && (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_BYTE)

/**
 ** GL_ALPHA, GL_UNSIGNED_BYTE
 **/

#ifndef GET_VALUE
#ifndef GET_PTR
#define GET_PTR(_x, _y) ( buf + (_x) + (_y) * pitch)
#endif

#define GET_VALUE(_x, _y) *(volatile GLubyte *)(GET_PTR(_x, _y))
#define PUT_VALUE(_x, _y, _v) *(volatile GLubyte *)(GET_PTR(_x, _y)) = (_v)
#endif /* GET_VALUE */

/* Only alpha is stored. */
#define WRITE_RGBA(_x, _y, r, g, b, a) \
   PUT_VALUE(_x, _y, (a) | ((r) & 0 /* quiet warnings */))

#define WRITE_PIXEL(_x, _y, p) PUT_VALUE(_x, _y, p)

/* Colour channels read back as 0; alpha is the stored byte. */
#define READ_RGBA( rgba, _x, _y ) \
   do { \
      GLubyte p = GET_VALUE(_x, _y); \
      rgba[0] = 0; \
      rgba[1] = 0; \
      rgba[2] = 0; \
      rgba[3] = p; \
   } while (0)

#else
#error SPANTMP_PIXEL_FMT must be set to a valid value!
#endif


/**
 ** Assembly routines.
 **/

#if defined( USE_MMX_ASM ) || defined( USE_SSE_ASM )
#include "x86/read_rgba_span_x86.h"
#include "x86/common_x86_asm.h"
#endif

/**
 * Write a horizontal span of RGBA pixels.
 *
 * \param ctx     unused.
 * \param rb      not referenced directly in this body.  NOTE(review):
 *                presumably consumed by LOCAL_VARS -- confirm against the
 *                including file.
 * \param n       number of pixels in the span.
 * \param x       column of the first pixel.
 * \param y       row of the span; passed through Y_FLIP before use.
 * \param values  array of \p n 4-byte (R, G, B, A) tuples.
 * \param mask    if non-NULL, pixel \c i is written only when
 *                \c mask[i] is non-zero.
 *
 * x1, n1 and i are handed to CLIPSPAN inside the write clip loop and then
 * drive the pixel loop; CLIPSPAN itself is defined outside this file.
 */
static void TAG(WriteRGBASpan)( struct gl_context *ctx,
                                struct gl_renderbuffer *rb,
                                GLuint n, GLint x, GLint y,
                                const void *values, const GLubyte mask[] )
{
   (void) ctx;

   HW_WRITE_LOCK()
      {
         const GLubyte (*rgba)[4] = (const GLubyte (*)[4]) values;
         GLint x1;
         GLint n1;
         LOCAL_VARS;

         y = Y_FLIP(y);

         HW_WRITE_CLIPLOOP()
            {
               GLint i = 0;
               CLIPSPAN(x,y,n,x1,n1,i);

               if (DBG) fprintf(stderr, "WriteRGBASpan %d..%d (x1 %d)\n",
                                (int)i, (int)n1, (int)x1);

               if (mask)
               {
                  for (;n1>0;i++,x1++,n1--)
                     if (mask[i])
                        WRITE_RGBA( x1, y,
                                    rgba[i][0], rgba[i][1],
                                    rgba[i][2], rgba[i][3] );
               }
               else
               {
                  for (;n1>0;i++,x1++,n1--)
                     WRITE_RGBA( x1, y,
                                 rgba[i][0], rgba[i][1],
                                 rgba[i][2], rgba[i][3] );
               }
            }
         HW_ENDCLIPLOOP();
      }
   HW_WRITE_UNLOCK();
}

/**
 * Write a horizontal span of RGB pixels.
 *
 * Identical to TAG(WriteRGBASpan) except that \p values holds 3-byte
 * (R, G, B) tuples and 255 is passed as the alpha component.
 */
static void TAG(WriteRGBSpan)( struct gl_context *ctx,
                               struct gl_renderbuffer *rb,
                               GLuint n, GLint x, GLint y,
                               const void *values, const GLubyte mask[] )
{
   (void) ctx;

   HW_WRITE_LOCK()
      {
         const GLubyte (*rgb)[3] = (const GLubyte (*)[3]) values;
         GLint x1;
         GLint n1;
         LOCAL_VARS;

         y = Y_FLIP(y);

         HW_WRITE_CLIPLOOP()
            {
               GLint i = 0;
               CLIPSPAN(x,y,n,x1,n1,i);

               if (DBG) fprintf(stderr, "WriteRGBSpan %d..%d (x1 %d)\n",
                                (int)i, (int)n1, (int)x1);

               if (mask)
               {
                  for (;n1>0;i++,x1++,n1--)
                     if (mask[i])
                        WRITE_RGBA( x1, y, rgb[i][0], rgb[i][1], rgb[i][2], 255 );
               }
               else
               {
                  for (;n1>0;i++,x1++,n1--)
                     WRITE_RGBA( x1, y, rgb[i][0], rgb[i][1], rgb[i][2], 255 );
               }
            }
         HW_ENDCLIPLOOP();
      }
   HW_WRITE_UNLOCK();
}

/*
 * NOTE(review): the text of TAG(WriteRGBAPixels) is damaged in this copy of
 * the file.  The loop header below is cut off after "i" and runs straight
 * into what looks like the tail of a span-read loop (READ_RGBA /
 * HW_READ_UNLOCK).  Whatever originally sat in between -- presumably the
 * rest of this function and the head of TAG(ReadRGBASpan), which is
 * referenced further down -- is missing.  The tokens are kept exactly as
 * found; restore this region from a pristine copy of the file rather than
 * reconstructing it by hand.
 */
static void TAG(WriteRGBAPixels)( struct gl_context *ctx,
                                  struct gl_renderbuffer *rb,
                                  GLuint n, const GLint x[], const GLint y[],
                                  const void *values, const GLubyte mask[] )
{
   (void) ctx;

   HW_WRITE_LOCK()
      {
         const GLubyte (*rgba)[4] = (const GLubyte (*)[4]) values;
         GLint i;
         LOCAL_VARS;

         if (DBG) fprintf(stderr, "WriteRGBAPixels\n");

         HW_WRITE_CLIPLOOP()
            {
               if (mask)
               {
                  for (i=0;i0;i++,x1++,n1--)
                     READ_RGBA( rgba[i], x1, y );
               }
         HW_ENDCLIPLOOP();
      }
   HW_READ_UNLOCK();
}

#if defined(GET_PTR) && \
   defined(USE_MMX_ASM) && \
   (((SPANTMP_PIXEL_FMT == GL_BGRA) && \
     (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)) || \
    ((SPANTMP_PIXEL_FMT == GL_RGB) && \
     (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_5_6_5)))
/**
 * MMX span reader: hands each clipped run to the matching
 * _generic_read_RGBA_span_*_MMX routine, reading directly from
 * GET_PTR(x1, y).  Unless USE_INNER_EMMS is defined, an "emms" instruction
 * is issued on entry and again before returning.
 */
static void TAG2(ReadRGBASpan,_MMX)( struct gl_context *ctx,
                                     struct gl_renderbuffer *rb,
                                     GLuint n, GLint x, GLint y, void *values)
{
#ifndef USE_INNER_EMMS
   /* The EMMS instruction is directly in-lined here because using GCC's
    * built-in _mm_empty function was found to utterly destroy performance.
    */
   __asm__ __volatile__( "emms" );
#endif

   (void) ctx;

   HW_READ_LOCK()
      {
         GLubyte (*rgba)[4] = (GLubyte (*)[4]) values;
         GLint x1,n1;
         LOCAL_VARS;

         y = Y_FLIP(y);

         if (DBG) fprintf(stderr, "ReadRGBASpan\n");

         HW_READ_CLIPLOOP()
            {
               GLint i = 0;
               CLIPSPAN(x,y,n,x1,n1,i);

               {
                  const void * src = GET_PTR( x1, y );
#if (SPANTMP_PIXEL_FMT == GL_RGB) && \
   (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_5_6_5)
                  _generic_read_RGBA_span_RGB565_MMX( src, rgba[i], n1 );
#else
                  _generic_read_RGBA_span_BGRA8888_REV_MMX( src, rgba[i], n1 );
#endif
               }
            }
         HW_ENDCLIPLOOP();
      }
   HW_READ_UNLOCK();
#ifndef USE_INNER_EMMS
   __asm__ __volatile__( "emms" );
#endif
}
#endif


#if defined(GET_PTR) && \
   defined(USE_SSE_ASM) && \
   (SPANTMP_PIXEL_FMT == GL_BGRA) && \
   (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)
/**
 * SSE2 span reader: hands each clipped run to
 * _generic_read_RGBA_span_BGRA8888_REV_SSE2, reading directly from
 * GET_PTR(x1, y).
 */
static void TAG2(ReadRGBASpan,_SSE2)( struct gl_context *ctx,
                                      struct gl_renderbuffer *rb,
                                      GLuint n, GLint x, GLint y,
                                      void *values)
{
   (void) ctx;

   HW_READ_LOCK()
      {
         GLubyte (*rgba)[4] = (GLubyte (*)[4]) values;
         GLint x1,n1;
         LOCAL_VARS;

         y = Y_FLIP(y);

         if (DBG) fprintf(stderr, "ReadRGBASpan\n");

         HW_READ_CLIPLOOP()
            {
               GLint i = 0;
               CLIPSPAN(x,y,n,x1,n1,i);

               {
                  const void * src = GET_PTR( x1, y );
                  _generic_read_RGBA_span_BGRA8888_REV_SSE2( src, rgba[i], n1 );
               }
            }
         HW_ENDCLIPLOOP();
      }
   HW_READ_UNLOCK();
}
#endif

#if defined(GET_PTR) && \
   defined(USE_SSE_ASM) && \
   (SPANTMP_PIXEL_FMT == GL_BGRA) && \
   (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)
/**
 * SSE span reader: hands each clipped run to
 * _generic_read_RGBA_span_BGRA8888_REV_SSE, reading directly from
 * GET_PTR(x1, y).  Unless USE_INNER_EMMS is defined, an "emms" instruction
 * is issued on entry and again before returning.
 */
static void TAG2(ReadRGBASpan,_SSE)( struct gl_context *ctx,
                                     struct gl_renderbuffer *rb,
                                     GLuint n, GLint x, GLint y,
                                     void *values)
{
#ifndef USE_INNER_EMMS
   /* The EMMS instruction is directly in-lined here because using GCC's
    * built-in _mm_empty function was found to utterly destroy performance.
    */
   __asm__ __volatile__( "emms" );
#endif

   (void) ctx;

   HW_READ_LOCK()
      {
         GLubyte (*rgba)[4] = (GLubyte (*)[4]) values;
         GLint x1,n1;
         LOCAL_VARS;

         y = Y_FLIP(y);

         if (DBG) fprintf(stderr, "ReadRGBASpan\n");

         HW_READ_CLIPLOOP()
            {
               GLint i = 0;
               CLIPSPAN(x,y,n,x1,n1,i);

               {
                  const void * src = GET_PTR( x1, y );
                  _generic_read_RGBA_span_BGRA8888_REV_SSE( src, rgba[i], n1 );
               }
            }
         HW_ENDCLIPLOOP();
      }
   HW_READ_UNLOCK();
#ifndef USE_INNER_EMMS
   __asm__ __volatile__( "emms" );
#endif
}
#endif


/*
 * NOTE(review): the text of TAG(ReadRGBAPixels) is damaged in this copy of
 * the file.  The loop header below is cut off after "i" and runs straight
 * into a list of renderbuffer function-pointer assignments that look like
 * the body of a separate initialisation function whose header is missing.
 * The tokens are kept exactly as found; restore this region from a pristine
 * copy of the file rather than reconstructing it by hand.
 *
 * What is visible after the cut: PutRow, PutRowRGB, PutValues and GetValues
 * are pointed at the TAG()-named functions from this file, and GetRow is
 * set to the first available of the SSE2, SSE and MMX span readers (each
 * gated by its build-time condition and by cpu_has_xmm2 / cpu_has_xmm /
 * cpu_has_mmx), falling back to TAG(ReadRGBASpan).
 */
static void TAG(ReadRGBAPixels)( struct gl_context *ctx,
                                 struct gl_renderbuffer *rb,
                                 GLuint n, const GLint x[], const GLint y[],
                                 void *values )
{
   (void) ctx;

   HW_READ_LOCK()
      {
         GLubyte (*rgba)[4] = (GLubyte (*)[4]) values;
         GLint i;
         LOCAL_VARS;

         if (DBG) fprintf(stderr, "ReadRGBAPixels\n");

         HW_READ_CLIPLOOP()
            {
               for (i=0;iPutRow = TAG(WriteRGBASpan);
   rb->PutRowRGB = TAG(WriteRGBSpan);
   rb->PutValues = TAG(WriteRGBAPixels);
   rb->GetValues = TAG(ReadRGBAPixels);

#if defined(GET_PTR)
#if defined(USE_SSE_ASM) && \
   (SPANTMP_PIXEL_FMT == GL_BGRA) && \
   (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)
   if ( cpu_has_xmm2 ) {
      if (DBG) fprintf( stderr, "Using %s version of GetRow\n", "SSE2" );
      rb->GetRow = TAG2(ReadRGBASpan, _SSE2);
   }
   else
#endif
#if defined(USE_SSE_ASM) && \
   (SPANTMP_PIXEL_FMT == GL_BGRA) && \
   (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)
   if ( cpu_has_xmm ) {
      if (DBG) fprintf( stderr, "Using %s version of GetRow\n", "SSE" );
      rb->GetRow = TAG2(ReadRGBASpan, _SSE);
   }
   else
#endif
#if defined(USE_MMX_ASM) && \
   (((SPANTMP_PIXEL_FMT == GL_BGRA) && \
     (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_INT_8_8_8_8_REV)) || \
    ((SPANTMP_PIXEL_FMT == GL_RGB) && \
     (SPANTMP_PIXEL_TYPE == GL_UNSIGNED_SHORT_5_6_5)))
   if ( cpu_has_mmx ) {
      if (DBG) fprintf( stderr, "Using %s version of GetRow\n", "MMX" );
      rb->GetRow = TAG2(ReadRGBASpan, _MMX);
   }
   else
#endif
#endif /* GET_PTR */
   {
      if (DBG) fprintf( stderr, "Using %s version of GetRow\n", "C" );
      rb->GetRow = TAG(ReadRGBASpan);
   }

}


/* Clear the per-instantiation macros. */
#undef WRITE_PIXEL
#undef WRITE_RGBA
#undef READ_RGBA
#undef TAG
#undef TAG2
#undef GET_VALUE
#undef PUT_VALUE
#undef GET_PTR
#undef SPANTMP_PIXEL_FMT
#undef SPANTMP_PIXEL_TYPE