diff options
author | jbrjake <[email protected]> | 2009-03-19 17:30:56 +0000 |
---|---|---|
committer | jbrjake <[email protected]> | 2009-03-19 17:30:56 +0000 |
commit | 24a14d05f1e1ddc42c9a0ccb9b0c4dfdc2ce29d2 (patch) | |
tree | 886a531b1f78e91bc05cb1f12e531da8fc880c6c /libhb/eedi2.c | |
parent | a5e78ebff48244d281ec149c4f1b88cff328ef99 (diff) |
Ports tritical's EEDI2 deinterlacing interpolator from AviSynth and implements it in the decomb filter as an optional, non-default substitute for yadif's internal, lower quality spatial predictions.
EEDI2 interpolation is enabled by setting mode (the first decomb parameter) to 5. Decomb now accepts -1 as a spatial metric (the second parameter), to bypass combing detection and force deinterlacing of all frames in the specified mode. Additional parameters have been appended to the end of the settings list for decomb, to specify various settings used by EEDI2. The default values for those should work well.
git-svn-id: svn://svn.handbrake.fr/HandBrake/trunk@2264 b64f7644-9d1e-0410-96f1-a4d463321fa5
Diffstat (limited to 'libhb/eedi2.c')
-rw-r--r-- | libhb/eedi2.c | 1870 |
1 files changed, 1870 insertions, 0 deletions
diff --git a/libhb/eedi2.c b/libhb/eedi2.c new file mode 100644 index 000000000..2aa906ef0 --- /dev/null +++ b/libhb/eedi2.c @@ -0,0 +1,1870 @@ +/* $Id: eedi2.c,v 1.0 2009/03/06 5:00:00 jbrjake Exp $ + + This file is part of the HandBrake source code. + Homepage: <http://handbrake.fr/>. + It may be used under the terms of the GNU General Public License. + + The EEDI2 interpolator was created by tritical: + http://web.missouri.edu/~kes25c/ +*/ + +#include "hb.h" +#include "eedi2.h" + +/** + * EEDI2 directional limit lookup table + * + * These values are used to limit the range of edge direction searches and filtering. + */ +const int eedi2_limlut[33] __attribute__ ((aligned (16))) = { + 6, 6, 7, 7, 8, 8, 9, 9, 9, 10, + 10, 11, 11, 12, 12, 12, 12, 12, 12, 12, + 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, + 12, -1, -1 }; + +/** + * Analog of _aligned_malloc + * @param size Size of memory being pointed to + * @param align_size Size of memory chunks to align to (must be power of 2) + */ +void *eedi2_aligned_malloc( size_t size, size_t align_size ) +{ + char * ptr, * ptr2, * aligned_ptr; + int align_mask = align_size - 1; + + ptr = (char *)malloc( size + align_size + sizeof( int ) ); + if( ptr==NULL ) return( NULL ); + + ptr2 = ptr + sizeof( int ); + aligned_ptr = ptr2 + ( align_size - ( (size_t)ptr2 & align_mask ) ); + + + ptr2 = aligned_ptr - sizeof( int ); + *( (int *)ptr2 ) = (int)( aligned_ptr - ptr ); + + return( aligned_ptr ); +} + +/** + * Analog of _aligned_free + * @param ptr The aligned pointer, created with eedi2_aligned_malloc, to be freed + */ +void eedi2_aligned_free( void *ptr ) +{ + int * ptr2 = (int *)ptr - 1; + ptr -= * ptr2; + free(ptr); +} + +/** + * Sorts metrics for median filtering + * @param order Pointer to the table of values to sort + * @param length Length of the order array + */ +void eedi2_sort_metrics( int *order, const int length ) +{ + int i; + for( i = 1; i < length; ++i ) + { + int j = i; + const int temp = order[j]; + while( j > 0 && order[j-1] > temp ) + { + order[j] = order[j-1]; + --j; + } + order[j] = temp; + } +} + +/** + * Bitblits an image plane (overwrites one bitmap with another) + * @param dtsp Pointer to destination bitmap + * @param dst_pitch Stride of destination bitmap + * @param srcp Pointer to source bitmap + * @param src_pitch Stride of destination bitmap + * @param row_size Width of the bitmap being copied + * @param height Height of the source bitmap + * + * When row_size, dst_pitch, and src_pitch are equal, eedi2_bit_blit can work more quickly by copying the whole plane at once instead of individual lines. + */ +void eedi2_bit_blit( uint8_t * dstp, int dst_pitch, + const uint8_t * srcp, int src_pitch, + int row_size, int height ) +{ + if( ( !height ) || ( !row_size ) ) + return; + + if( height == 1 || ( dst_pitch == src_pitch && src_pitch == row_size ) ) + { + memcpy( dstp, srcp, row_size * height ); + } + else + { + int y; + for( y = height; y > 0; --y ) + { + memcpy( dstp, srcp, row_size ); + dstp += dst_pitch; + srcp += src_pitch; + } + } +} + +/** + * A specialized variant of bit_blit, just for setting up the initial, field-sized bitmap planes that EEDI2 interpolates from. + * @param src Pointer to source bitmap plane being copied from + * @param dst Pointer to the destination bitmap plane being copied to + * @param pitch Stride of both bitmaps + * @param height Height of the original, full-size src plane being copied from + */ +void eedi2_fill_half_height_buffer_plane( uint8_t * src, uint8_t * dst, int pitch, int height ) +{ + /* When TFF, we want to copy alternating + lines starting at 0, the top field. + When BFF, we want to start at line 1. */ + int y; + for( y = height; y > 0; y = y - 2 ) + { + memcpy( dst, src, pitch ); + dst += pitch; + src += pitch * 2; + } +} + +/** + * A specialized variant of bit_blit, just for resizing the field-height maps EEDI2 generates to frame-height...a simple line doubler + * @param srcp Pointer to source bitmap plane being copied from + * @param dstp Pointer to the destination bitmap plane being copied to + * @param height Height of the input, half-size src plane being copied from + * @param pitch Stride of both bitmaps + */ +void eedi2_upscale_by_2( uint8_t * srcp, uint8_t * dstp, int height, int pitch ) +{ + int y; + for( y = height; y > 0; y-- ) + { + memcpy( dstp, srcp, pitch ); + dstp += pitch; + memcpy( dstp, srcp, pitch ); + srcp += pitch; + dstp += pitch; + } +} + +/** + * Finds places where verticaly adjacent pixels abruptly change in intensity, i.e., sharp edges. + * @param dstp Pointer to the destination bitmap + * @param dst_pitch Stride of dstp + * @param srcp Pointer to the source bitmap + * @param src_pitch Stride of srcp + * @param mtresh Magnitude threshold, ensures it doesn't mark edges on pixels that are too similar (10 is a good default value) + * @param vthresh Variance threshold, ensures it doesn't look for edges in highly random pixel blocks (20 is a good default value) + * @param lthresh Laplacian threshold, ensures edges are still prominent in the 2nd spatial derivative of the srcp plane (20 is a good default value) + * @param height Height of half-height single-field frame + * @param width Width of srcp bitmap rows, as opposed to the padded stride in src_pitch + */ +void eedi2_build_edge_mask( uint8_t * dstp, int dst_pitch, uint8_t *srcp, int src_pitch, + int mthresh, int lthresh, int vthresh, int height, int width ) +{ + int x, y; + + mthresh = mthresh * 10; + vthresh = vthresh * 81; + + memset( dstp, 0, ( height / 2 ) * dst_pitch ); + + srcp += src_pitch; + dstp += dst_pitch; + unsigned char *srcpp = srcp-src_pitch; + unsigned char *srcpn = srcp+src_pitch; + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width-1; ++x ) + { + if( ( abs( srcpp[x] - srcp[x] ) < 10 && + abs( srcp[x] - srcpn[x] ) < 10 && + abs( srcpp[x] - srcpn[x] ) < 10 ) + || + ( abs( srcpp[x-1] - srcp[x-1] ) < 10 && + abs( srcp[x-1] - srcpn[x-1] ) < 10 && + abs( srcpp[x-1] - srcpn[x-1] ) < 10 && + abs( srcpp[x+1] - srcp[x+1] ) < 10 && + abs( srcp[x+1] - srcpn[x+1] ) < 10 && + abs( srcpp[x+1] - srcpn[x+1] ) < 10) ) + continue; + + const int sum = srcpp[x-1] + srcpp[x] + srcpp[x+1] + + srcp[x-1] + srcp[x]+ srcp[x+1] + + srcpn[x-1] + srcpn[x] + srcpn[x+1]; + + const int sumsq = srcpp[x-1] * srcpp[x-1] + + srcpp[x] * srcpp[x] + + srcpp[x+1] * srcpp[x+1] + + srcp[x-1] * srcp[x-1] + + srcp[x] * srcp[x] + + srcp[x+1] * srcp[x+1] + + srcpn[x-1] * srcpn[x-1] + + srcpn[x] * srcpn[x] + + srcpn[x+1] * srcpn[x+1]; + + if( 9 * sumsq-sum * sum < vthresh ) + continue; + + const int Ix = srcp[x+1] - srcp[x-1]; + const int Iy = MAX( MAX( abs( srcpp[x] - srcpn[x] ), + abs( srcpp[x] - srcp[x] ) ), + abs( srcp[x] - srcpn[x] ) ); + if( Ix * Ix + Iy * Iy >= mthresh ) + { + dstp[x] = 255; + continue; + } + + const int Ixx = srcp[x-1] - 2 * srcp[x] + srcp[x+1]; + const int Iyy = srcpp[x] - 2 * srcp[x] + srcpn[x]; + if( abs( Ixx ) + abs( Iyy ) >= lthresh ) + dstp[x] = 255; + } + dstp += dst_pitch; + srcpp += src_pitch; + srcp += src_pitch; + srcpn += src_pitch; + } +} + +/** + * Expands and smooths out the edge mask + * @param mskp Pointer to the source edge mask being read from + * @param msk_pitch Stride of mskp + * @param dstp Pointer to the destination to store the dilated edge mask + * @param dst_pitch Stride of dstp + * @param dstr Dilation threshold, ensures a pixel is only retained as an edge in dstp if this number of adjacent pixels or greater are also edges in mskp (4 is a good default value) + * @param height Height of half-height field-sized frame + * @param width Width of mskp bitmap rows, as opposed to the pdded stride in msk_pitch + */ +void eedi2_dilate_edge_mask( uint8_t *mskp, int msk_pitch, uint8_t *dstp, int dst_pitch, + int dstr, int height, int width ) +{ + int x, y; + + eedi2_bit_blit( dstp, dst_pitch, mskp, msk_pitch, width, height ); + + mskp += msk_pitch; + unsigned char *mskpp = mskp - msk_pitch; + unsigned char *mskpn = mskp + msk_pitch; + dstp += dst_pitch; + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0 ) + continue; + + int count = 0; + if( mskpp[x-1] == 0xFF ) ++count; + if( mskpp[x] == 0xFF ) ++count; + if( mskpp[x+1] == 0xFF ) ++count; + if( mskp[x-1] == 0xFF ) ++count; + if( mskp[x+1] == 0xFF ) ++count; + if( mskpn[x-1] == 0xFF ) ++count; + if( mskpn[x] == 0xFF ) ++count; + if( mskpn[x+1] == 0xFF ) ++count; + + if( count >= dstr ) + dstp[x] = 0xFF; + } + mskpp += msk_pitch; + mskp += msk_pitch; + mskpn += msk_pitch; + dstp += dst_pitch; + } +} + +/** + * Contracts the edge mask + * @param mskp Pointer to the source edge mask being read from + * @param msk_pitch Stride of mskp + * @param dstp Pointer to the destination to store the eroded edge mask + * @param dst_pitch Stride of dstp + * @param estr Erosion threshold, ensures a pixel isn't retained as an edge in dstp if fewer than this number of adjacent pixels are also edges in mskp (2 is a good default value) + * @param height Height of half-height field-sized frame + * @param width Width of mskp bitmap rows, as opposed to the pdded stride in msk_pitch + */ +void eedi2_erode_edge_mask( uint8_t *mskp, int msk_pitch, uint8_t *dstp, int dst_pitch, + int estr, int height, int width ) +{ + int x, y; + + eedi2_bit_blit( dstp, dst_pitch, mskp, msk_pitch, width, height ); + + mskp += msk_pitch; + unsigned char *mskpp = mskp - msk_pitch; + unsigned char *mskpn = mskp + msk_pitch; + dstp += dst_pitch; + for ( y = 1; y < height - 1; ++y ) + { + for ( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0xFF ) continue; + + int count = 0; + if ( mskpp[x-1] == 0xFF ) ++count; + if ( mskpp[x] == 0xFF ) ++count; + if ( mskpp[x+1] == 0xFF ) ++count; + if ( mskp[x-1] == 0xFF ) ++count; + if ( mskp[x+1] == 0xFF ) ++count; + if ( mskpn[x-1] == 0xFF ) ++count; + if ( mskpn[x] == 0xFF ) ++count; + if ( mskpn[x+1] == 0xFF ) ++count; + + if ( count < estr) dstp[x] = 0; + } + mskpp += msk_pitch; + mskp += msk_pitch; + mskpn += msk_pitch; + dstp += dst_pitch; + } +} + +/** + * Smooths out horizontally aligned holes in the mask + * + * If none of the 6 horizontally adjacent pixels are edges, mark the current pixel as not edged. + * If at least 1 of the 3 on either side are edges, mark the current pixel as an edge. + * + * @param mskp Pointer to the source edge mask being read from + * @param msk_pitch Stride of mskp + * @param dstp Pointer to the destination to store the smoothed edge mask + * @param dst_pitch Stride of dstp + * @param height Height of half-height field-sized frame + * @param width Width of mskp bitmap rows, as opposed to the pdded stride in msk_pitch + */ +void eedi2_remove_small_gaps( uint8_t * mskp, int msk_pitch, uint8_t * dstp, int dst_pitch, + int height, int width ) +{ + int x, y; + + eedi2_bit_blit( dstp, dst_pitch, mskp, msk_pitch, width, height ); + + mskp += msk_pitch; + dstp += dst_pitch; + for( y = 1; y < height - 1; ++y ) + { + for( x = 3; x < width - 3; ++x ) + { + if( mskp[x] ) + { + if( mskp[x-3] ) continue; + if( mskp[x-2] ) continue; + if( mskp[x-1] ) continue; + if( mskp[x+1] ) continue; + if( mskp[x+2] ) continue; + if( mskp[x+3] ) continue; + dstp[x] = 0; + } + else + { + if ( ( mskp[x+1] && ( mskp[x-1] || mskp[x-2] || mskp[x-3] ) ) || + ( mskp[x+2] && ( mskp[x-1] || mskp[x-2] ) ) || + ( mskp[x+3] && mskp[x-1] ) ) + dstp[x] = 0xFF; + } + } + mskp += msk_pitch; + dstp += dst_pitch; + } +} + +/** + * Calculates spatial direction vectors for the edges. This is EEDI2's timesink, and can be thought of as YADIF_CHECK on steroids, as both try to discern which angle a given edge follows + * @param plane The plane of the image being processed, to know to reduce maxd for chroma planes (HandBrake only works with YUV420 video so it is assumed they are half-height) + * @param mskp Pointer to the source edge mask being read from + * @param msk_pitch Stride of mskp + * @param srcp Pointer to the source image being filtered + * @param src_pitch Stride of srcp + * @param dstp Pointer to the destination to store the dilated edge mask + * @param dst_pitch Stride of dstp + * @param maxd Maximum pixel distance to search (24 is a good default value) + * @param nt Noise threshold (50 is a good default value) + * @param height Height of half-height field-sized frame + * @param width Width of srcp bitmap rows, as opposed to the pdded stride in src_pitch + */ +void eedi2_calc_directions( const int plane, uint8_t * mskp, int msk_pitch, uint8_t * srcp, int src_pitch, + uint8_t * dstp, int dst_pitch, int maxd, int nt, int height, int width ) +{ + int x, y, u, i; + + memset( dstp, 255, dst_pitch * height ); + mskp += msk_pitch; + dstp += dst_pitch; + srcp += src_pitch; + unsigned char *src2p = srcp - src_pitch * 2; + unsigned char *srcpp = srcp - src_pitch; + unsigned char *srcpn = srcp + src_pitch; + unsigned char *src2n = srcp + src_pitch * 2; + unsigned char *mskpp = mskp - msk_pitch; + unsigned char *mskpn = mskp + msk_pitch; + const int maxdt = plane == 0 ? maxd : ( maxd >> 1 ); + + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0xFF || ( mskp[x-1] != 0xFF && mskp[x+1] != 0xFF ) ) + continue; + const int startu = MAX( -x + 1, -maxdt ); + const int stopu = MIN( width - 2 - x, maxdt ); + int minb = MIN( 13 * nt, + ( abs( srcp[x] - srcpn[x] ) + + abs( srcp[x] - srcpp[x] ) ) * 6 ); + int mina = MIN( 19 * nt, + ( abs( srcp[x] - srcpn[x] ) + + abs( srcp[x] - srcpp[x] ) ) * 9 ); + int minc = mina; + int mind = minb; + int mine = minb; + int dira = -5000, dirb = -5000, dirc = -5000, dird = -5000, dire = -5000; + for( u = startu; u <= stopu; ++u ) + { + if( y == 1 || + mskpp[x-1+u] == 0xFF || mskpp[x+u] == 0xFF || mskpp[x+1+u] == 0xFF ) + { + if( y == height - 2 || + mskpn[x-1-u] == 0xFF || mskpn[x-u] == 0xFF || mskpn[x+1-u] == 0xFF ) + { + const int diffsn = abs( srcp[x-1] - srcpn[x-1-u] ) + + abs( srcp[x] - srcpn[x-u] ) + + abs( srcp[x+1] - srcpn[x+1-u] ); + + const int diffsp = abs( srcp[x-1] - srcpp[x-1+u] ) + + abs( srcp[x] - srcpp[x+u] ) + + abs( srcp[x+1] - srcpp[x+1+u] ); + + const int diffps = abs( srcpp[x-1] - srcp[x-1-u] ) + + abs( srcpp[x] - srcp[x-u] ) + + abs( srcpp[x+1] - srcp[x+1-u] ); + + const int diffns = abs( srcpn[x-1] - srcp[x-1+u] ) + + abs( srcpn[x] - srcp[x+u] ) + + abs( srcpn[x+1] - srcp[x+1+u] ); + + const int diff = diffsn + diffsp + diffps + diffns; + int diffd = diffsp + diffns; + int diffe = diffsn + diffps; + if( diff < minb ) + { + dirb = u; + minb = diff; + } + if( __builtin_expect( y > 1, 1) ) + { + const int diff2pp = abs( src2p[x-1] - srcpp[x-1-u] ) + + abs( src2p[x] - srcpp[x-u] ) + + abs( src2p[x+1] - srcpp[x+1-u] ); + const int diffp2p = abs( srcpp[x-1] - src2p[x-1+u] ) + + abs( srcpp[x] - src2p[x+u] ) + + abs( srcpp[x+1] - src2p[x+1+u] ); + const int diffa = diff + diff2pp + diffp2p; + diffd += diffp2p; + diffe += diff2pp; + if( diffa < mina ) + { + dira = u; + mina = diffa; + } + } + if( __builtin_expect( y < height-2, 1) ) + { + const int diff2nn = abs( src2n[x-1] - srcpn[x-1+u] ) + + abs( src2n[x] - srcpn[x+u] ) + + abs( src2n[x+1] - srcpn[x+1+u] ); + const int diffn2n = abs( srcpn[x-1] - src2n[x-1-u] ) + + abs( srcpn[x] - src2n[x-u] ) + + abs( srcpn[x+1] - src2n[x+1-u] ); + const int diffc = diff + diff2nn + diffn2n; + diffd += diff2nn; + diffe += diffn2n; + if( diffc < minc ) + { + dirc = u; + minc = diffc; + } + } + if( diffd < mind ) + { + dird = u; + mind = diffd; + } + if( diffe < mine ) + { + dire = u; + mine = diffe; + } + } + } + } + int order[5], k=0; + if( dira != -5000 ) order[k++] = dira; + if( dirb != -5000 ) order[k++] = dirb; + if( dirc != -5000 ) order[k++] = dirc; + if( dird != -5000 ) order[k++] = dird; + if( dire != -5000 ) order[k++] = dire; + if( k > 1 ) + { + eedi2_sort_metrics( order, k ); + const int mid = ( k & 1 ) ? + order[k>>1] : + ( order[(k-1)>>1] + order[k>>1] + 1 ) >> 1; + const int tlim = MAX( eedi2_limlut[abs(mid)] >> 2, 2 ); + int sum = 0, count = 0; + for( i = 0; i < k; ++i ) + { + if( abs( order[i] - mid ) <= tlim ) + { + ++count; + sum += order[i]; + } + } + if( count > 1 ) + dstp[x] = 128 + ( (int)( (float)sum / (float)count ) * 4 ); + else + dstp[x] = 128; + } + else dstp[x] = 128; + } + mskpp += msk_pitch; + mskp += msk_pitch; + mskpn += msk_pitch; + src2p += src_pitch; + srcpp += src_pitch; + srcp += src_pitch; + srcpn += src_pitch; + src2n += src_pitch; + dstp += dst_pitch; + } +} + +/** + * Filters the edge mask + * @param mskp Pointer to the source edge mask being read from + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the filtered edge mask + * @param dst_pitch Stride of dstp + * @param height Height of half-height field-sized frame + * @param width Width of mskp bitmap rows, as opposed to the pdded stride in msk_pitch + */ +void eedi2_filter_map( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int height, int width ) +{ + int x, y, j; + + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + + mskp += msk_pitch; + dmskp += dmsk_pitch; + dstp += dst_pitch; + unsigned char *dmskpp = dmskp - dmsk_pitch; + unsigned char *dmskpn = dmskp + dmsk_pitch; + + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width - 1; ++x ) + { + if( dmskp[x] == 0xFF || mskp[x] != 0xFF ) + continue; + const int dir = ( dmskp[x] - 128 ) >> 2; + const int lim = MAX( abs( dir ) * 2, 12 ); + int ict = 0, icb = 0; + if( dir < 0 ) + { + const int dirt = MAX( -x, dir ); + for( j = dirt; j <= 0; ++j ) + { + if( ( abs( dmskpp[x+j] - dmskp[x] ) > lim && dmskpp[x+j] != 0xFF ) || + ( dmskp[x+j] == 0xFF && dmskpp[x+j] == 0xFF ) || + ( abs( dmskp[x+j] - dmskp[x] ) > lim && dmskp[x+j] != 0xFF ) ) + { + ict = 1; + break; + } + } + } + else + { + const int dirt = MIN( width - x - 1, dir ); + for( j = 0; j <= dirt; ++j ) + { + if( ( abs( dmskpp[x+j] - dmskp[x] ) > lim && dmskpp[x+j] != 0xFF ) || + ( dmskp[x+j] == 0xFF && dmskpp[x+j] == 0xFF ) || + ( abs( dmskp[x+j] - dmskp[x] ) > lim && dmskp[x+j] != 0xFF ) ) + { + ict = 1; + break; + } + } + } + if( ict ) + { + if( dir < 0 ) + { + const int dirt = MIN( width - x - 1, abs( dir ) ); + for( j = 0; j <= dirt; ++j ) + { + if( ( abs( dmskpn[x+j] - dmskp[x] ) > lim && dmskpn[x+j] != 0xFF ) || + ( dmskpn[x+j] == 0xFF && dmskp[x+j] == 0xFF ) || + ( abs( dmskp[x+j] - dmskp[x] ) > lim && dmskp[x+j] != 0xFF ) ) + { + icb = 1; + break; + } + } + } + else + { + const int dirt = MAX( -x, -dir ); + for( j = dirt; j <= 0; ++j ) + { + if( ( abs( dmskpn[x+j] - dmskp[x] ) > lim && dmskpn[x+j] != 0xFF ) || + ( dmskpn[x+j] == 0xFF && dmskp[x+j] == 0xFF ) || + ( abs( dmskp[x+j] - dmskp[x] ) > lim && dmskp[x+j] != 0xFF ) ) + { + icb = 1; + break; + } + } + } + if( icb ) + dstp[x] = 255; + } + } + mskp += msk_pitch; + dmskpp += dmsk_pitch; + dmskp += dmsk_pitch; + dmskpn += dmsk_pitch; + dstp += dst_pitch; + } +} + + +/** + * Filters the edge direction mask + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the filtered edge direction mask + * @param dst_pitch Stride of dstp + * @param height Height of half_height field-sized frame + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_filter_dir_map( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int height, int width ) +{ + int x, y, i; + + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + + dmskp += dmsk_pitch; + unsigned char *dmskpp = dmskp - dmsk_pitch; + unsigned char *dmskpn = dmskp + dmsk_pitch; + dstp += dst_pitch; + mskp += msk_pitch; + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0xFF ) continue; + int u = 0, order[9]; + if( dmskpp[x-1] != 0xFF ) order[u++] = dmskpp[x-1]; + if( dmskpp[x] != 0xFF ) order[u++] = dmskpp[x]; + if( dmskpp[x+1] != 0xFF ) order[u++] = dmskpp[x+1]; + if( dmskp[x-1] != 0xFF ) order[u++] = dmskp[x-1]; + if( dmskp[x] != 0xFF ) order[u++] = dmskp[x]; + if( dmskp[x+1] != 0xFF ) order[u++] = dmskp[x+1]; + if( dmskpn[x-1] != 0xFF ) order[u++] = dmskpn[x-1]; + if( dmskpn[x] != 0xFF ) order[u++] = dmskpn[x]; + if( dmskpn[x+1] != 0xFF ) order[u++] = dmskpn[x+1]; + if( u < 4 ) + { + dstp[x] = 255; + continue; + } + eedi2_sort_metrics( order, u ); + const int mid = ( u & 1 ) ? + order[u>>1] : ( order[(u-1)>>1] + order[u>>1] + 1 ) >> 1; + int sum = 0, count = 0; + const int lim = eedi2_limlut[abs(mid-128)>>2]; + for( i = 0; i < u; ++i ) + { + if( abs( order[i] - mid ) <= lim ) + { + ++count; + sum += order[i]; + } + } + if( count < 4 || ( count < 5 && dmskp[x] == 0xFF ) ) + { + dstp[x] = 255; + continue; + } + dstp[x] = (int)( ( (float)( sum + mid ) / (float)( count + 1 ) ) + 0.5f ); + } + dmskpp += dmsk_pitch; + dmskp += dmsk_pitch; + dmskpn += dmsk_pitch; + dstp += dst_pitch; + mskp += msk_pitch; + } +} + +/** + * Smoothes out the edge direction map + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the expanded edge direction mask + * @param dst_pitch Stride of dstp + * @param height Height of half-height field-sized frame + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_expand_dir_map( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int height, int width ) +{ + int x, y, i; + + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + + dmskp += dmsk_pitch; + unsigned char *dmskpp = dmskp - dmsk_pitch; + unsigned char *dmskpn = dmskp + dmsk_pitch; + dstp += dst_pitch; + mskp += msk_pitch; + for( y = 1; y < height - 1; ++y ) + { + for( x = 1; x < width - 1; ++x ) + { + if( dmskp[x] != 0xFF || mskp[x] != 0xFF ) continue; + int u = 0, order[9]; + if( dmskpp[x-1] != 0xFF ) order[u++] = dmskpp[x-1]; + if( dmskpp[x] != 0xFF ) order[u++] = dmskpp[x]; + if( dmskpp[x+1] != 0xFF ) order[u++] = dmskpp[x+1]; + if( dmskp[x-1] != 0xFF ) order[u++] = dmskp[x-1]; + if( dmskp[x+1] != 0xFF ) order[u++] = dmskp[x+1]; + if( dmskpn[x-1] != 0xFF ) order[u++] = dmskpn[x-1]; + if( dmskpn[x] != 0xFF ) order[u++] = dmskpn[x]; + if( dmskpn[x+1] != 0xFF ) order[u++] = dmskpn[x+1]; + if( u < 5 ) continue; + eedi2_sort_metrics( order, u ); + const int mid = ( u & 1 ) ? + order[u>>1] : ( order[(u-1)>>1] + order[u>>1] + 1 ) >> 1; + int sum = 0, count = 0; + const int lim = eedi2_limlut[abs(mid-128)>>2]; + for( i = 0; i < u; ++i ) + { + if( abs( order[i] - mid ) <= lim ) + { + ++count; + sum += order[i]; + } + } + if( count < 5 ) continue; + dstp[x] = (int)( ( (float)( sum + mid ) / (float)( count + 1 ) ) + 0.5f ); + } + dmskpp += dmsk_pitch; + dmskp += dmsk_pitch; + dmskpn += dmsk_pitch; + dstp += dst_pitch; + mskp += msk_pitch; + } +} + +/** + * Re-draws a clearer, less blocky frame-height edge direction mask + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the redrawn direction mask + * @param dst_pitch Stride of dstp + * @param tff Whether or not the frame parity is Top Field First + * @param height Height of the full-frame output + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_mark_directions_2x( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int tff, int height, int width ) +{ + int x, y, i; + memset( dstp, 255, dst_pitch * height ); + dstp += dst_pitch * ( 2 - tff ); + dmskp += dmsk_pitch * ( 1 - tff ); + mskp += msk_pitch * ( 1 - tff ); + unsigned char *dmskpn = dmskp + dmsk_pitch * 2; + unsigned char *mskpn = mskp + msk_pitch * 2; + for( y = 2 - tff; y < height - 1; y += 2 ) + { + for( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0xFF && mskpn[x] != 0xFF ) continue; + int v = 0, order[6]; + if( dmskp[x-1] != 0xFF ) order[v++] = dmskp[x-1]; + if( dmskp[x] != 0xFF ) order[v++] = dmskp[x]; + if( dmskp[x+1] != 0xFF ) order[v++] = dmskp[x+1]; + if( dmskpn[x-1] != 0xFF ) order[v++] = dmskpn[x-1]; + if( dmskpn[x] != 0xFF ) order[v++] = dmskpn[x]; + if( dmskpn[x+1] != 0xFF ) order[v++] = dmskpn[x+1]; + if( v < 3 ) continue; + else + { + eedi2_sort_metrics( order, v ); + const int mid = ( v & 1 ) ? order[v>>1] : ( order[(v-1)>>1] + order[v>>1]+1) >> 1; + const int lim = eedi2_limlut[abs(mid-128)>>2]; + int u = 0; + if( abs( dmskp[x-1] - dmskpn[x-1] ) <= lim || + dmskp[x-1] == 0xFF || dmskpn[x-1] == 0xFF ) + ++u; + if( abs( dmskp[x] - dmskpn[x] ) <= lim || + dmskp[x] == 0xFF || dmskpn[x] == 0xFF ) + ++u; + if( abs( dmskp[x+1] - dmskpn[x-1] ) <= lim || + dmskp[x+1] == 0xFF || dmskpn[x+1] == 0xFF) + ++u; + if( u < 2 ) continue; + int count = 0, sum = 0; + for( i = 0; i < v; ++i ) + { + if( abs( order[i] - mid ) <= lim ) + { + ++count; + sum += order[i]; + } + } + if( count < v - 2 || count < 2 ) continue; + dstp[x] = (int)( ( (float)( sum + mid ) / (float)( count + 1 ) ) + 0.5f ); + } + } + mskp += msk_pitch * 2; + mskpn += msk_pitch * 2; + dstp += dst_pitch * 2; + dmskp += dmsk_pitch * 2; + dmskpn += dmsk_pitch * 2; + } +} + +/** + * Filters the frane-height edge direction mask + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the filtered direction mask + * @param dst_pitch Stride of dstp + * @param field Field to filter + * @param height Height of the full-frame output + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_filter_dir_map_2x( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int field, int height, int width ) +{ + int x, y, i; + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + dmskp += dmsk_pitch * ( 2 - field ); + unsigned char *dmskpp = dmskp - dmsk_pitch * 2; + unsigned char *dmskpn = dmskp + dmsk_pitch * 2; + mskp += msk_pitch * ( 1 - field ); + unsigned char *mskpn = mskp + msk_pitch * 2; + dstp += dst_pitch * ( 2 - field ); + for( y = 2 - field; y < height - 1; y += 2 ) + { + for( x = 1; x < width - 1; ++x ) + { + if( mskp[x] != 0xFF && mskpn[x] != 0xFF ) continue; + int u = 0, order[9]; + if( y > 1 ) + { + if( dmskpp[x-1] != 0xFF ) order[u++] = dmskpp[x-1]; + if( dmskpp[x] != 0xFF ) order[u++] = dmskpp[x]; + if( dmskpp[x+1] != 0xFF ) order[u++] = dmskpp[x+1]; + } + if( dmskp[x-1] != 0xFF ) order[u++] = dmskp[x-1]; + if( dmskp[x] != 0xFF ) order[u++] = dmskp[x]; + if( dmskp[x+1] != 0xFF ) order[u++] = dmskp[x+1]; + if( y < height - 2 ) + { + if( dmskpn[x-1] != 0xFF ) order[u++] = dmskpn[x-1]; + if( dmskpn[x] != 0xFF ) order[u++] = dmskpn[x]; + if( dmskpn[x+1] != 0xFF ) order[u++] = dmskpn[x+1]; + } + if( u < 4 ) + { + dstp[x] = 255; + continue; + } + eedi2_sort_metrics( order, u ); + const int mid = ( u & 1 ) ? order[u>>1] : (order[(u-1)>>1] + order[u>>1] + 1 ) >> 1; + int sum = 0, count = 0; + const int lim = eedi2_limlut[abs(mid-128)>>2]; + for( i = 0; i < u; ++i ) + { + if( abs( order[i] - mid ) <= lim ) + { + ++count; + sum += order[i]; + } + } + if( count < 4 || ( count < 5 && dmskp[x] == 0xFF ) ) + { + dstp[x] = 255; + continue; + } + dstp[x] = (int)( ( (float)( sum + mid ) / (float)( count + 1 ) ) + 0.5f ); + } + mskp += msk_pitch * 2; + mskpn += msk_pitch * 2; + dmskpp += dmsk_pitch * 2; + dmskp += dmsk_pitch * 2; + dmskpn += dmsk_pitch * 2; + dstp += dst_pitch * 2; + } +} + +/** + * Smoothes out the frame-height edge direction mask + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the expanded direction mask + * @param dst_pitch Stride of dstp + * @param field Field to filter + * @param height Height of the full-frame output + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_expand_dir_map_2x( uint8_t * mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int field, int height, int width ) +{ + int x, y, i; + + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + + dmskp += dmsk_pitch * ( 2 - field ); + unsigned char *dmskpp = dmskp - dmsk_pitch * 2; + unsigned char *dmskpn = dmskp + dmsk_pitch * 2; + mskp += msk_pitch * ( 1 - field ); + unsigned char *mskpn = mskp + msk_pitch * 2; + dstp += dst_pitch * ( 2 - field ); + for( y = 2 - field; y < height - 1; y += 2) + { + for( x = 1; x < width - 1; ++x ) + { + if( dmskp[x] != 0xFF || ( mskp[x] != 0xFF && mskpn[x] != 0xFF ) ) continue; + int u = 0, order[9]; + if( y > 1 ) + { + if( dmskpp[x-1] != 0xFF ) order[u++] = dmskpp[x-1]; + if( dmskpp[x] != 0xFF ) order[u++] = dmskpp[x]; + if( dmskpp[x+1] != 0xFF ) order[u++] = dmskpp[x+1]; + } + if( dmskp[x-1] != 0xFF ) order[u++] = dmskp[x-1]; + if( dmskp[x+1] != 0xFF ) order[u++] = dmskp[x+1]; + if( y < height - 2 ) + { + if( dmskpn[x-1] != 0xFF) order[u++] = dmskpn[x-1]; + if( dmskpn[x] != 0xFF) order[u++] = dmskpn[x]; + if( dmskpn[x+1] != 0xFF) order[u++] = dmskpn[x+1]; + } + if( u < 5 ) continue; + eedi2_sort_metrics( order, u ); + const int mid = ( u & 1 ) ? order[u>>1] : ( order[(u-1)>>1] + order[u>>1] + 1 ) >> 1; + int sum = 0, count = 0; + const int lim = eedi2_limlut[abs(mid-128)>>2]; + for( i = 0; i < u; ++i ) + { + if( abs( order[i] - mid ) <= lim ) + { + ++count; + sum += order[i]; + } + } + if( count < 5 ) continue; + dstp[x] = (int)( ( (float)( sum + mid ) / (float)( count + 1 ) ) + 0.5f ); + } + mskp += msk_pitch * 2; + mskpn += msk_pitch * 2; + dmskpp += dmsk_pitch * 2; + dmskp += dmsk_pitch * 2; + dmskpn += dmsk_pitch * 2; + dstp += dst_pitch * 2; + } +} + +/** + * Like the name suggests, this function fills in gaps in the frame-height edge direction mask + * @param mskp Pointer to the edge mask + * @param msk_pitch Stride of mskp + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the destination to store the filled-in direction mask + * @param dst_pitch Stride of dstp + * @param field Field to filter + * @param height Height of the full-frame output + * @param width Width of dmskp bitmap rows, as opposed to the pdded stride in dmsk_pitch + */ +void eedi2_fill_gaps_2x( uint8_t *mskp, int msk_pitch, uint8_t * dmskp, int dmsk_pitch, + uint8_t * dstp, int dst_pitch, int field, int height, int width ) +{ + int x, y, j; + + eedi2_bit_blit( dstp, dst_pitch, dmskp, dmsk_pitch, width, height ); + + dmskp += dmsk_pitch * ( 2 - field ); + unsigned char *dmskpp = dmskp - dmsk_pitch * 2; + unsigned char *dmskpn = dmskp + dmsk_pitch * 2; + mskp += msk_pitch * ( 1 - field ); + unsigned char *mskpp = mskp - msk_pitch * 2; + unsigned char *mskpn = mskp + msk_pitch * 2; + unsigned char *mskpnn = mskpn + msk_pitch * 2; + dstp += dst_pitch * ( 2 - field ); + for( y = 2 - field; y < height - 1; y += 2 ) + { + for( x = 1; x < width - 1; ++x ) + { + if( dmskp[x] != 0xFF || + ( mskp[x] != 0xFF && mskpn[x] != 0xFF ) ) continue; + int u = x - 1, back = 500, forward = -500; + while( u ) + { + if( dmskp[u] != 0xFF ) + { + back = dmskp[u]; + break; + } + if( mskp[u] != 0xFF && mskpn[u] != 0xFF ) break; + --u; + } + int v = x + 1; + while( v < width ) + { + if( dmskp[v] != 0xFF ) + { + forward = dmskp[v]; + break; + } + if( mskp[v] != 0xFF && mskpn[v] != 0xFF ) break; + ++v; + } + int tc = 1, bc = 1; + int mint = 500, maxt = -20; + int minb = 500, maxb = -20; + for( j = u; j <= v; ++j ) + { + if( tc ) + { + if( y <= 2 || dmskpp[j] == 0xFF || ( mskpp[j] != 0xFF && mskp[j] != 0xFF ) ) + { + tc = 0; + mint = maxt = 20; + } + else + { + if( dmskpp[j] < mint ) mint = dmskpp[j]; + if( dmskpp[j] > maxt ) maxt = dmskpp[j]; + } + } + if( bc ) + { + if( y >= height - 3 || dmskpn[j] == 0xFF || ( mskpn[j] != 0xFF && mskpnn[j] != 0xFF ) ) + { + bc = 0; + minb = maxb = 20; + } + else + { + if( dmskpn[j] < minb ) minb = dmskpn[j]; + if( dmskpn[j] > maxb ) maxb = dmskpn[j]; + } + } + } + if( maxt == -20 ) maxt = mint = 20; + if( maxb == -20 ) maxb = minb = 20; + int thresh = MAX( + MAX( MAX( abs( forward - 128 ), abs( back - 128 ) ) >> 2, 8 ), + MAX( abs( mint - maxt ), abs( minb - maxb ) ) ); + const int flim = MIN( + MAX( abs( forward - 128 ), abs( back - 128 ) ) >> 2, + 6 ); + if( abs( forward - back ) <= thresh && ( v - u - 1 <= flim || tc || bc ) ) + { + double step = (double)( forward - back ) / (double)( v - u ); + for( j = 0; j < v - u - 1; ++j ) + dstp[u+j+1] = back + (int)( j * step + 0.5 ); + } + } + mskpp += msk_pitch * 2; + mskp += msk_pitch * 2; + mskpn += msk_pitch * 2; + mskpnn += msk_pitch * 2; + dmskpp += dmsk_pitch * 2; + dmskp += dmsk_pitch * 2; + dmskpn += dmsk_pitch * 2; + dstp += dst_pitch * 2; + } +} + +/** + * Actually renders the output frame, based on the edge and edge direction masks + * @param plane The plane of the image being processed, to know to reduce a search distance for chroma planes (HandBrake only works with YUV420 video so it is assumed they are half-height) + * @param dmskp Pointer to the edge direction mask being read from + * @param dmsk_pitch Stride of dmskp + * @param dstp Pointer to the line-doubled source field used being filtered in place + * @param dst_pitch Stride of dstp + * @param omskp Pointer to the destination to store the output edge mask used for post-processing + * @param osmk_pitch Stride of omskp + * @param field Field to filter + * @nt Noise threshold, (50 is a good default value) + * @param height Height of the full-frame output + * @param width Width of dstp bitmap rows, as opposed to the pdded stride in dst_pitch + */ +void eedi2_interpolate_lattice( const int plane, uint8_t * dmskp, int dmsk_pitch, uint8_t * dstp, + int dst_pitch, uint8_t * omskp, int omsk_pitch, int field, int nt, + int height, int width ) +{ + int x, y, u; + + if( field == 1 ) + { + eedi2_bit_blit( dstp + ( height - 1 ) * dst_pitch, + dst_pitch, + dstp + ( height - 2 ) * dst_pitch, + dst_pitch, + width, + 1 ); + } + else + { + eedi2_bit_blit( dstp, + dst_pitch, + dstp + dst_pitch, + dst_pitch, + width, + 1 ); + } + + dstp += dst_pitch * ( 1 - field ); + omskp += omsk_pitch * ( 1 - field ); + unsigned char *dstpn = dstp + dst_pitch; + unsigned char *dstpnn = dstp + dst_pitch * 2; + unsigned char *omskn = omskp + omsk_pitch * 2; + dmskp += dmsk_pitch * ( 2 - field ); + for( y = 2 - field; y < height - 1; y += 2 ) + { + for( x = 0; x < width; ++x ) + { + int dir = dmskp[x]; + const int lim = eedi2_limlut[abs(dir-128)>>2]; + if( dir == 255 || + ( abs( dmskp[x] - dmskp[x-1] ) > lim && + abs( dmskp[x] - dmskp[x+1] ) > lim ) ) + { + dstpn[x] = ( dstp[x] + dstpnn[x] + 1 ) >> 1; + if( dir != 255 ) dmskp[x] = 128; + continue; + } + if( lim < 9 ) + { + const int sum = dstp[x-1] + dstp[x] + dstp[x+1] + + dstpnn[x-1] + dstpnn[x] + dstpnn[x+1]; + const int sumsq = dstp[x-1] * dstp[x-1] + + dstp[x] * dstp[x] + + dstp[x+1] * dstp[x+1] + + dstpnn[x-1] * dstpnn[x-1] + + dstpnn[x] * dstpnn[x] + + dstpnn[x+1] * dstpnn[x+1]; + if( 6 * sumsq - sum * sum < 576 ) + { + dstpn[x] = ( dstp[x] + dstpnn[x] + 1 ) >> 1; + dmskp[x] = 255; + continue; + } + } + if( x > 1 && x < width - 2 && + ( dstp[x] < MAX( dstp[x-2], dstp[x-1] ) - 3 && + dstp[x] < MAX( dstp[x+2], dstp[x+1] ) - 3 && + dstpnn[x] < MAX( dstpnn[x-2], dstpnn[x-1] ) - 3 && + dstpnn[x] < MAX( dstpnn[x+2], dstpnn[x+1] ) - 3 ) + || + ( dstp[x] > MIN( dstp[x-2], dstp[x-1] ) + 3 && + dstp[x] > MIN( dstp[x+2], dstp[x+1] ) + 3 && + dstpnn[x] > MIN( dstpnn[x-2], dstpnn[x-1] ) + 3 && + dstpnn[x] > MIN( dstpnn[x+2], dstpnn[x+1] ) + 3 ) ) + { + dstpn[x] = ( dstp[x] + dstpnn[x] + 1 ) >> 1; + dmskp[x] = 128; + continue; + } + dir = ( dir - 128 + 2 ) >> 2; + int val = ( dstp[x] + dstpnn[x] + 1 ) >> 1; + const int startu = ( dir - 2 < 0 ) ? + MAX( -x + 1, MAX( dir - 2, -width + 2 + x ) ) + : + MIN( x - 1, MIN( dir - 2, width - 2 - x ) ); + const int stopu = ( dir + 2 < 0 ) ? + MAX( -x + 1, MAX( dir + 2, -width + 2 + x ) ) + : + MIN( x - 1, MIN( dir + 2, width - 2 - x ) ); + int min = 8 * nt; + for( u = startu; u <= stopu; ++u ) + { + const int diff = + abs( dstp[x-1] - dstpnn[x-u-1] ) + + abs( dstp[x] - dstpnn[x-u] ) + + abs( dstp[x+1] - dstpnn[x-u+1] ) + + abs( dstpnn[x-1] - dstp[x+u-1] ) + + abs( dstpnn[x] - dstp[x+u] ) + + abs( dstpnn[x+1] - dstp[x+u+1] ); + if( diff < min && + ( ( omskp[x-1+u] != 0xFF && abs( omskp[x-1+u] - dmskp[x] ) <= lim ) || + ( omskp[x+u] != 0xFF && abs( omskp[x+u] - dmskp[x]) <= lim ) || + ( omskp[x+1+u] != 0xFF && abs( omskp[x+1+u] - dmskp[x]) <= lim ) ) && + ( ( omskn[x-1-u] != 0xFF && abs( omskn[x-1-u] - dmskp[x]) <= lim ) || + ( omskn[x-u] != 0xFF && abs( omskn[x-u] - dmskp[x]) <= lim ) || + ( omskn[x+1-u] != 0xFF && abs( omskn[x+1-u] - dmskp[x]) <= lim ) ) ) + { + const int diff2 = + abs( dstp[x+(u>>1)-1] - dstpnn[x-(u>>1)-1] ) + + abs( dstp[x+(u>>1)] - dstpnn[x-(u>>1)] ) + + abs( dstp[x+(u>>1)+1] - dstpnn[x-(u>>1)+1] ); + if( diff2 < 4 * nt && + ( ( ( abs( omskp[x+(u>>1)] - omskn[x-(u>>1)] ) <= lim || + abs( omskp[x+(u>>1)] - omskn[x-((u+1)>>1)] ) <= lim ) && + omskp[x+(u>>1)] != 0xFF ) + || + ( ( abs( omskp[x+((u+1)>>1)] - omskn[x-(u>>1)] ) <= lim || + abs( omskp[x+((u+1)>>1)] - omskn[x-((u+1)>>1)] ) <= lim ) && + omskp[x+((u+1)>>1)] != 0xFF ) ) ) + { + if( ( abs( dmskp[x] - omskp[x+(u>>1)] ) <= lim || + abs( dmskp[x] - omskp[x+((u+1)>>1)] ) <= lim ) && + ( abs( dmskp[x] - omskn[x-(u>>1)] ) <= lim || + abs( dmskp[x] - omskn[x-((u+1)>>1)] ) <= lim ) ) + { + val = ( dstp[x+(u>>1)] + dstp[x+((u+1)>>1)] + + dstpnn[x-(u>>1)] + dstpnn[x-((u+1)>>1)] + 2 ) >> 2; + min = diff; + dir = u; + } + } + } + } + if( min != 8 * nt ) + { + dstpn[x] = val; + dmskp[x] = 128 + dir * 4; + } + else + { + const int minm = MIN( dstp[x], dstpnn[x] ); + const int maxm = MAX( dstp[x], dstpnn[x] ); + const int d = plane == 0 ? 4 : 2; + const int startu = MAX( -x + 1, -d ); + const int stopu = MIN( width - 2 - x, d ); + min = 7 * nt; + for( u = startu; u <= stopu; ++u ) + { + const int p1 = dstp[x+(u>>1)] + dstp[x+((u+1)>>1)]; + const int p2 = dstpnn[x-(u>>1)] + dstpnn[x-((u+1)>>1)]; + const int diff = + abs( dstp[x-1] - dstpnn[x-u-1] ) + + abs( dstp[x] - dstpnn[x-u] ) + + abs( dstp[x+1] - dstpnn[x-u+1] ) + + abs( dstpnn[x-1] - dstp[x+u-1] ) + + abs( dstpnn[x] - dstp[x+u] ) + + abs( dstpnn[x+1] - dstp[x+u+1] ) + + abs( p1 - p2 ); + if( diff < min ) + { + const int valt = ( p1 + p2 + 2 ) >> 2; + if( valt >= minm && valt <= maxm ) + { + val = valt; + min = diff; + dir = u; + } + } + } + dstpn[x] = val; + if( min == 7*nt ) dmskp[x] = 128; + else dmskp[x] = 128 + dir * 4; + } + } + dstp += dst_pitch * 2; + dstpn += dst_pitch * 2; + dstpnn += dst_pitch * 2; + dmskp += dmsk_pitch * 2; + omskp += omsk_pitch * 2; + omskn += omsk_pitch * 2; + } +} + +/** + * Applies some extra filtering to smooth the edge direction mask + * @param nmskp Pointer to the newly-filtered edge direction mask being read from + * @param nmsk_pitch Stride of nmskp + * @param omskp Pointer to the old unfiltered edge direction mask being read from + * @param omsk_pitch Stride of osmkp + * @param dstp Pointer to the output image being filtered in place + * @param src_pitch Stride of dstp ....not sure why it's named this + * @param field Field to filter + * @param height Height of the full-frame output + * @param width Width of dstp bitmap rows, as opposed to the pdded stride in src_pitch + */ +void eedi2_post_process( uint8_t * nmskp, int nmsk_pitch, uint8_t * omskp, int omsk_pitch, + uint8_t * dstp, int src_pitch, int field, int height, int width ) +{ + int x, y; + + nmskp += ( 2 - field ) * nmsk_pitch; + omskp += ( 2 - field ) * omsk_pitch; + dstp += ( 2 - field ) * src_pitch; + unsigned char *srcpp = dstp - src_pitch; + unsigned char *srcpn = dstp + src_pitch; + for( y = 2 - field; y < height - 1; y += 2 ) + { + for( x = 0; x < width; ++x ) + { + const int lim = eedi2_limlut[abs(nmskp[x]-128)>>2]; + if( abs( nmskp[x] - omskp[x] ) > lim && omskp[x] != 255 && omskp[x] != 128 ) + dstp[x] = ( srcpp[x] + srcpn[x] + 1 ) >> 1; + } + nmskp += nmsk_pitch * 2; + omskp += omsk_pitch * 2; + srcpp += src_pitch * 2; + dstp += src_pitch * 2; + srcpn += src_pitch * 2; + } +} + +/** + * Blurs the source field plane + * @param src Pointer to the half-height source field plane + * @param src_pitch Stride of src + * @param tmp Pointer to a temporary buffer for juggling bitmaps + * @param tmp_pitch Stride of tmp + * @param dst Pointer to the destination to store the blurred field plane + * @param dst_pitch Stride of dst + * @param height Height of the hakf-height field-sized frame + * @param width Width of dstp bitmap rows, as opposed to the padded stride in dst_pitch + */ +void eedi2_gaussian_blur1( uint8_t * src, int src_pitch, uint8_t * tmp, int tmp_pitch, uint8_t * dst, int dst_pitch, int height, int width ) +{ + uint8_t * srcp = src; + uint8_t * dstp = tmp; + int x, y; + + for( y = 0; y < height; ++y ) + { + dstp[0] = ( srcp[3] * 582 + srcp[2] * 7078 + srcp[1] * 31724 + + srcp[0] * 26152 + 32768 ) >> 16; + dstp[1] = ( srcp[4] * 582 + srcp[3] * 7078 + + ( srcp[0] + srcp[2] ) * 15862 + + srcp[1] * 26152 + 32768 ) >> 16; + dstp[2] = ( srcp[5] * 582 + ( srcp[0] + srcp[4] ) * 3539 + + ( srcp[1] + srcp[3] ) * 15862 + + srcp[2]*26152 + 32768 ) >> 16; + for( x = 3; x < width - 3; ++x ) + { + dstp[x] = ( ( srcp[x-3] + srcp[x+3] ) * 291 + + ( srcp[x-2] + srcp[x+2] ) * 3539 + + ( srcp[x-1] + srcp[x+1] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + dstp[x] = ( srcp[x-3] * 582 + ( srcp[x-2] + srcp[x+2] ) * 3539 + + ( srcp[x-1] + srcp[x+1] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x-3] * 582 + srcp[x-2] * 7078 + + ( srcp[x-1] + srcp[x+1] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x-3] * 582 + srcp[x-2] * 7078 + + srcp[x-1] * 31724 + srcp[x] * 26152 + 32768 ) >> 16; + srcp += src_pitch; + dstp += tmp_pitch; + } + srcp = tmp; + dstp = dst; + unsigned char *src3p = srcp - tmp_pitch * 3; + unsigned char *src2p = srcp - tmp_pitch * 2; + unsigned char *srcpp = srcp - tmp_pitch; + unsigned char *srcpn = srcp + tmp_pitch; + unsigned char *src2n = srcp + tmp_pitch * 2; + unsigned char *src3n = srcp + tmp_pitch * 3; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3n[x] * 582 + src2n[x] * 7078 + srcpn[x] * 31724 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += tmp_pitch; + src2p += tmp_pitch; + srcpp += tmp_pitch; + srcp += tmp_pitch; + srcpn += tmp_pitch; + src2n += tmp_pitch; + src3n += tmp_pitch; + dstp += dst_pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3n[x] * 582 + src2n[x] * 7078 + + ( srcpp[x] + srcpn[x] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += tmp_pitch; + src2p += tmp_pitch; + srcpp += tmp_pitch; + srcp += tmp_pitch; + srcpn += tmp_pitch; + src2n += tmp_pitch; + src3n += tmp_pitch; + dstp += dst_pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3n[x] * 582 + ( src2p[x] + src2n[x] ) * 3539 + + ( srcpp[x] + srcpn[x] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += src_pitch; + src2p += src_pitch; + srcpp += src_pitch; + srcp += src_pitch; + srcpn += src_pitch; + src2n += src_pitch; + src3n += src_pitch; + dstp += dst_pitch; + for( y = 3; y < height - 3; ++y ) + { + for( x = 0; x < width; ++x ) + { + dstp[x] = ( ( src3p[x] + src3n[x] ) * 291 + + ( src2p[x] + src2n[x] ) * 3539 + + ( srcpp[x] + srcpn[x] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += tmp_pitch; + src2p += tmp_pitch; + srcpp += tmp_pitch; + srcp += tmp_pitch; + srcpn += tmp_pitch; + src2n += tmp_pitch; + src3n += tmp_pitch; + dstp += dst_pitch; + } + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3p[x] * 582 + ( src2p[x] + src2n[x] ) *3539 + + ( srcpp[x] + srcpn[x] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += tmp_pitch; + src2p += tmp_pitch; + srcpp += tmp_pitch; + srcp += tmp_pitch; + srcpn += tmp_pitch; + src2n += tmp_pitch; + src3n += tmp_pitch; + dstp += dst_pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3p[x] * 582 + src2p[x] * 7078 + + ( srcpp[x] + srcpn[x] ) * 15862 + + srcp[x] * 26152 + 32768 ) >> 16; + } + src3p += tmp_pitch; + src2p += tmp_pitch; + srcpp += tmp_pitch; + srcp += tmp_pitch; + srcpn += tmp_pitch; + src2n += tmp_pitch; + src3n += tmp_pitch; + dstp += dst_pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src3p[x] * 582 + src2p[x] * 7078 + + srcpp[x] * 31724 + srcp[x] * 26152 + 32768 ) >> 16; + } +} + + +/** + * Blurs the spatial derivatives of the source field plane + * @param src Pointer to the derivative array to filter + * @param tmp Pointer to a temporary storage for the derivative array while it's being filtered + * @param dst Pointer to the destination to store the filtered output derivative array + * @param pitch Stride of the bitmap from which the src array is derived + * @param height Height of the half-height field-sized frame from which the src array derivs were taken + * @param width Width of the bitmap from which the src array is derived, as opposed to the padded stride in pitch + */ +void eedi2_gaussian_blur_sqrt2( int *src, int *tmp, int *dst, const int pitch, int height, const int width ) +{ + int * srcp = src; + int * dstp = tmp; + int x, y; + + for( y = 0; y < height; ++y ) + { + x = 0; + dstp[x] = ( srcp[x+4] * 678 + srcp[x+3] * 3902 + srcp[x+2] * 13618 + + srcp[x+1] * 28830 + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x+4] * 678 + srcp[x+3] * 3902 + srcp[x+2] * 13618 + + ( srcp[x-1] + srcp[x+1] ) *14415 + + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x+4] * 678 + srcp[x+3] * 3902 + + ( srcp[x-2] + srcp[x+2] ) * 6809 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x+4] * 678 + ( srcp[x-3] + srcp[x+3] ) * 1951 + + ( srcp[x-2] + srcp[x+2] ) * 6809 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + + for( x = 4; x < width - 4; ++x ) + { + dstp[x] = ( ( srcp[x-4] + srcp[x+4] ) * 339 + + ( srcp[x-3] + srcp[x+3] ) * 1951 + + ( srcp[x-2] + srcp[x+2] ) * 6809 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + } + + dstp[x] = ( srcp[x-4] * 678 + ( srcp[x-3] + srcp[x+3] ) * 1951 + + ( srcp[x-2] + srcp[x+2] ) * 6809 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x-4] * 678 + srcp[x-3] * 3902 + + ( srcp[x-2] + srcp[x+2] ) * 6809 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x-4] * 678 + srcp[x+3] * 3902 + srcp[x-2] * 13618 + + ( srcp[x-1] + srcp[x+1] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 16; + ++x; + dstp[x] = ( srcp[x-4] * 678 + srcp[x-3] * 3902 + srcp[x-2] * 13618 + + srcp[x-1] * 28830 + + srcp[x] * 18508 + 32768 ) >> 16; + srcp += pitch; + dstp += pitch; + } + dstp = dst; + srcp = tmp; + int * src4p = srcp - pitch * 4; + int * src3p = srcp - pitch * 3; + int * src2p = srcp - pitch * 2; + int * srcpp = srcp - pitch; + int * srcpn = srcp + pitch; + int * src2n = srcp + pitch * 2; + int * src3n = srcp + pitch * 3; + int * src4n = srcp + pitch * 4; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4n[x] * 678 + src3n[x] * 3902 + + src2n[x] * 13618 + srcpn[x] * 28830 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4n[x] * 678 + src3n[x] * 3902 + src2n[x] * 13618 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4n[x] * 678 + src3n[x] * 3902 + + ( src2p[x] + src2n[x] ) * 6809 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4n[x] * 678 + ( src3p[x] + src3n[x] ) * 1951 + + ( src2p[x] + src2n[x] ) * 6809 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( y = 4; y < height - 4; ++y ) + { + for( x = 0; x < width; ++x ) + { + dstp[x] = ( ( src4p[x] + src4n[x] ) * 339 + + ( src3p[x] + src3n[x] ) * 1951 + + ( src2p[x] + src2n[x] ) * 6809 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + } + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4p[x] * 678 + + ( src3p[x] + src3n[x] ) * 1951 + + ( src2p[x] + src2n[x] ) * 6809 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4p[x] * 678 + src3p[x] * 3902 + + ( src2p[x] + src2n[x] ) * 6809 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4p[x] * 678 + src3p[x] * 3902 + src2p[x] * 13618 + + ( srcpp[x] + srcpn[x] ) * 14415 + + srcp[x] * 18508 + 32768 ) >> 18; + } + src4p += pitch; + src3p += pitch; + src2p += pitch; + srcpp += pitch; + srcp += pitch; + srcpn += pitch; + src2n += pitch; + src3n += pitch; + src4n += pitch; + dstp += pitch; + for( x = 0; x < width; ++x ) + { + dstp[x] = ( src4p[x] * 678 + src3p[x] * 3902 + + src2p[x] * 13618 + srcpp[x] * 28830 + + srcp[x] * 18508 + 32768 ) >> 18; + } +} + +/** + * Finds spatial derivatives for a a source field plane + * @param srcp Pointer to the plane to derive + * @param src_pitch Stride of srcp + * @param height Height of the half-height field-sized frame + * @param width Width of srcp bitmap rows, as opposed to the padded stride in src_pitch + * @param x2 Pointed to the array to store the x/x derivatives + * @param y2 Pointer to the array to store the y/y derivatives + * @param xy Pointer to the array to store the x/y derivatives + */ +void eedi2_calc_derivatives( uint8_t *srcp, int src_pitch, int height, int width, int *x2, int *y2, int *xy) +{ + + unsigned char * srcpp = srcp - src_pitch; + unsigned char * srcpn = srcp + src_pitch; + int x, y; + { + const int Ix = srcp[1] - srcp[0]; + const int Iy = srcp[0] - srcpn[0]; + x2[0] = ( Ix * Ix ) >> 1; + y2[0] = ( Iy * Iy ) >> 1; + xy[0] = ( Ix * Iy ) >> 1; + } + for( x = 1; x < width - 1; ++x ) + { + const int Ix = srcp[x+1] - srcp[x-1]; + const int Iy = srcp[x] - srcpn[x]; + x2[x] = ( Ix * Ix ) >> 1; + y2[x] = ( Iy * Iy ) >> 1; + xy[x] = ( Ix * Iy ) >> 1; + } + { + const int Ix = srcp[x] - srcp[x-1]; + const int Iy = srcp[x] - srcpn[x]; + x2[x] = ( Ix * Ix ) >> 1; + y2[x] = ( Iy * Iy ) >> 1; + xy[x] = ( Ix * Iy ) >> 1; + } + srcpp += src_pitch; + srcp += src_pitch; + srcpn += src_pitch; + x2 += src_pitch; + y2 += src_pitch; + xy += src_pitch; + for( y = 1; y < height - 1; ++y ) + { + { + const int Ix = srcp[1] - srcp[0]; + const int Iy = srcpp[0] - srcpn[0]; + x2[0] = ( Ix * Ix ) >> 1; + y2[0] = ( Iy * Iy ) >> 1; + xy[0] = ( Ix * Iy ) >> 1; + } + for ( x = 1; x < width - 1; ++x ) + { + const int Ix = srcp[x+1] - srcp[x-1]; + const int Iy = srcpp[x] - srcpn[x]; + x2[x] = ( Ix * Ix ) >> 1; + y2[x] = ( Iy * Iy ) >> 1; + xy[x] = ( Ix * Iy ) >> 1; + } + { + const int Ix = srcp[x] - srcp[x-1]; + const int Iy = srcpp[x] - srcpn[x]; + x2[x] = ( Ix *Ix ) >> 1; + y2[x] = ( Iy *Iy ) >> 1; + xy[x] = ( Ix *Iy ) >> 1; + } + srcpp += src_pitch; + srcp += src_pitch; + srcpn += src_pitch; + x2 += src_pitch; + y2 += src_pitch; + xy += src_pitch; + } + { + const int Ix = srcp[1] - srcp[0]; + const int Iy = srcpp[0] - srcp[0]; + x2[0] = ( Ix * Ix ) >> 1; + y2[0] = ( Iy * Iy ) >> 1; + xy[0] = ( Ix * Iy ) >> 1; + } + for( x = 1; x < width - 1; ++x ) + { + const int Ix = srcp[x+1] - srcp[x-1]; + const int Iy = srcpp[x] - srcp[x]; + x2[x] = ( Ix * Ix ) >> 1; + y2[x] = ( Iy * Iy ) >> 1; + xy[x] = ( Ix * Iy ) >> 1; + } + { + const int Ix = srcp[x] - srcp[x-1]; + const int Iy = srcpp[x] - srcp[x]; + x2[x] = ( Ix * Ix ) >> 1; + y2[x] = ( Iy * Iy ) >> 1; + xy[x] = ( Ix * Iy ) >> 1; + } +} + +/** + * Filters junctions and corners for the output image + * @param x2 Pointer to the x/x derivatives + * @param y2 Pointer to the y/y derivatives + * @param xy Pointer to the x/y derivatives + * @param pitch Stride of the source field plane from which the derivatives were calculated + * @param mskp Pointer to the edge direction mask + * @param msk_pitch Stride of mskp + * @param dstp Pointer to the output image being filtered in place + * @param dst_pitch Stride of dstp + * @param height Height of the full-frame output plane + * @param width Width of dstp bitmap rows, as opposed to the padded stride in dst_pitch + * @param field Field to filter + */ +void eedi2_post_process_corner( int *x2, int *y2, int *xy, const int pitch, uint8_t * mskp, int msk_pitch, uint8_t * dstp, int dst_pitch, int height, int width, int field ) +{ + mskp += ( 8 - field ) * msk_pitch; + dstp += ( 8 - field ) * dst_pitch; + unsigned char * dstpp = dstp - dst_pitch; + unsigned char * dstpn = dstp + dst_pitch; + x2 += pitch * 3; + y2 += pitch * 3; + xy += pitch * 3; + int *x2n = x2 + pitch; + int *y2n = y2 + pitch; + int *xyn = xy + pitch; + int x, y; + + for( y = 8 - field; y < height - 7; y += 2 ) + { + for( x = 4; x < width - 4; ++x ) + { + if( mskp[x] == 255 || mskp[x] == 128 ) continue; + const int c1 = (int)( x2[x] * y2[x] - xy[x] * xy[x] - 0.09 * + ( x2[x] + y2[x] ) * ( x2[x] + y2[x] ) ); + const int c2 = (int)( x2n[x] * y2n[x] - xyn[x]* xyn[x] - 0.09 * + ( x2n[x] + y2n[x] ) * ( x2n[x] + y2n[x] ) ); + if (c1 > 775 || c2 > 775) + dstp[x] = ( dstpp[x] + dstpn[x] + 1 ) >> 1; + } + mskp += msk_pitch * 2; + dstpp += dst_pitch * 2; + dstp += dst_pitch * 2; + dstpn += dst_pitch * 2; + x2 += pitch; + x2n += pitch; + y2 += pitch; + y2n += pitch; + xy += pitch; + xyn += pitch; + } +} |