diff options
author | jbrjake <[email protected]> | 2007-07-16 17:41:26 +0000 |
---|---|---|
committer | jbrjake <[email protected]> | 2007-07-16 17:41:26 +0000 |
commit | d2287c205b2d116cfc26765e40031f43f079a1fd (patch) | |
tree | 3aa4906b65a5a3aac04451e553b614b3824598c4 /contrib/patch-x264-aq.patch | |
parent | 82ae6b4bc0c502aacea3dd17b8d5e1ac5b22c04b (diff) |
Updates x264 to revision 665 and applies Haali's adaptive quantizer patch, creating two new advanced options: aq-strength and aq-sensitivity.
git-svn-id: svn://svn.handbrake.fr/HandBrake/trunk@699 b64f7644-9d1e-0410-96f1-a4d463321fa5
Diffstat (limited to 'contrib/patch-x264-aq.patch')
-rw-r--r-- | contrib/patch-x264-aq.patch | 239 |
1 files changed, 239 insertions, 0 deletions
diff --git a/contrib/patch-x264-aq.patch b/contrib/patch-x264-aq.patch new file mode 100644 index 000000000..21e424b82 --- /dev/null +++ b/contrib/patch-x264-aq.patch @@ -0,0 +1,239 @@ +Index: encoder/encoder.c
+===================================================================
+--- encoder/encoder.c (revisione 634)
++++ encoder/encoder.c (copia locale)
+@@ -470,6 +470,8 @@
+ if( !h->param.b_cabac ) + h->param.analyse.i_trellis = 0; + h->param.analyse.i_trellis = x264_clip3( h->param.analyse.i_trellis, 0, 2 ); ++ if( h->param.analyse.b_aq && h->param.analyse.f_aq_strength <= 0 ) ++ h->param.analyse.b_aq = 0; + h->param.analyse.i_noise_reduction = x264_clip3( h->param.analyse.i_noise_reduction, 0, 1<<16 ); + + { +Index: encoder/analyse.c
+===================================================================
+--- encoder/analyse.c (revisione 634)
++++ encoder/analyse.c (copia locale)
+@@ -29,6 +29,7 @@
+ #include <unistd.h> + + #include "common/common.h" ++#include "common/cpu.h" + #include "macroblock.h" + #include "me.h" + #include "ratecontrol.h" +@@ -2026,8 +2027,73 @@
+ } + } + ++static void x264_add_dctq(int16_t dct[8][8], int *p_total) { ++ int i, t = 0; ++ int16_t *p = &dct[0][0]; + ++ for (i = 1; i < 64; ++i) ++ t += abs(p[i]) * x264_dct8_weight_tab[i]; ++ ++ *p_total += t; ++} ++ + /***************************************************************************** ++ * x264_adaptive_quant: ++ * check if mb is "flat", i.e. has most energy in low frequency components, and ++ * adjust qp down if it is ++ *****************************************************************************/ ++void x264_adaptive_quant( x264_t *h, x264_mb_analysis_t *a ) ++{ ++ DECLARE_ALIGNED( static uint8_t, zero[FDEC_STRIDE*8], 16 ); ++ ++ int16_t dct[8][8]; ++ int total = 0; ++ int i_qp = h->mb.i_qp, i_qp_adj; ++ float fc; ++ ++ if( i_qp <= 10 ) /* AQ is probably not needed at such low QP */ ++ return; ++ ++ if( h->pixf.sad[PIXEL_16x16](h->mb.pic.p_fenc[0], FENC_STRIDE, zero, 16) > 64*16*16 ) ++ { /* light places */ ++ if( h->pixf.count_8x8(h->mb.pic.p_fenc[1], FENC_STRIDE, 0x81818181) < 40 ) ++ /* not enough "blue" pixels */ ++ return; ++ ++ if( h->pixf.count_8x8(h->mb.pic.p_fenc[2], FENC_STRIDE, 0x87878787) > 24 ) ++ /* too many "red" pixels */ ++ return; ++ } ++ ++ h->dctf.sub8x8_dct8( dct, h->mb.pic.p_fenc[0], zero ); ++ x264_add_dctq( dct, &total ); ++ h->dctf.sub8x8_dct8( dct, h->mb.pic.p_fenc[0] + 8, zero ); ++ x264_add_dctq( dct, &total ); ++ h->dctf.sub8x8_dct8( dct, h->mb.pic.p_fenc[0] + 8*FENC_STRIDE, zero ); ++ x264_add_dctq( dct, &total ); ++ h->dctf.sub8x8_dct8( dct, h->mb.pic.p_fenc[0] + 8*FENC_STRIDE + 8, zero ); ++ x264_add_dctq( dct, &total ); ++ ++ if( total == 0 ) /* sum is 0, nothing to do */ ++ return; ++ ++ x264_cpu_restore( h->param.cpu ); ++ ++ fc = (float)expf(-5e-13 * total * total); ++ ++ //printf("AQ: %d %.3f\n", total, fc); ++ /* the function is chosen such that it stays close to 0 in almost all ++ * range of 0..1, and rapidly goes up to 1 near 1.0 */ ++ i_qp_adj = (int)(i_qp * h->param.analyse.f_aq_strength / pow(2 - fc, h->param.analyse.f_aq_sensitivity)); ++ ++ /* don't adjust by more than this amount */ ++ i_qp_adj = X264_MIN(i_qp_adj, i_qp/2); ++ ++ h->mb.i_qp = a->i_qp = i_qp - i_qp_adj; ++ h->mb.i_chroma_qp = i_chroma_qp_table[x264_clip3( h->mb.i_qp + h->pps->i_chroma_qp_index_offset, 0, 51 )]; ++} ++ ++/***************************************************************************** + * x264_macroblock_analyse: + *****************************************************************************/ + void x264_macroblock_analyse( x264_t *h ) +@@ -2039,6 +2105,10 @@
+ /* init analysis */ + x264_mb_analyse_init( h, &analysis, x264_ratecontrol_qp( h ) ); + ++ /* try to do adaptive quantization */ ++ if( h->param.analyse.b_aq ) ++ x264_adaptive_quant( h, &analysis); ++ + /*--------------------------- Do the analysis ---------------------------*/ + if( h->sh.i_type == SLICE_TYPE_I ) + { +Index: x264.c
+===================================================================
+--- x264.c (revisione 634)
++++ x264.c (copia locale)
+@@ -253,6 +253,12 @@
+ " - 2: enabled on all mode decisions\n", defaults->analyse.i_trellis ); + H0( " --no-fast-pskip Disables early SKIP detection on P-frames\n" ); + H0( " --no-dct-decimate Disables coefficient thresholding on P-frames\n" ); ++ H0( " --aq-strength <float> Amount to adjust QP per MB [%.1f]\n" ++ " 0.0: no AQ\n" ++ " 1.1: strong AQ\n", defaults->analyse.f_aq_strength ); ++ H0( " --aq-sensitivity <float> \"Flatness\" threshold to trigger AQ [%.1f]\n" ++ " 5: applies to almost all blocks\n" ++ " 22: only flat blocks\n", defaults->analyse.f_aq_sensitivity ); + H0( " --nr <integer> Noise reduction [%d]\n", defaults->analyse.i_noise_reduction ); + H1( "\n" ); + H1( " --deadzone-inter <int> Set the size of the inter luma quantization deadzone [%d]\n", defaults->analyse.i_luma_deadzone[0] ); +@@ -416,6 +422,8 @@
+ { "trellis", required_argument, NULL, 't' }, + { "no-fast-pskip", no_argument, NULL, 0 }, + { "no-dct-decimate", no_argument, NULL, 0 }, ++ { "aq-strength", required_argument, NULL, 0 }, ++ { "aq-sensitivity", required_argument, NULL, 0 }, + { "deadzone-inter", required_argument, NULL, '0' }, + { "deadzone-intra", required_argument, NULL, '0' }, + { "level", required_argument, NULL, 0 }, +Index: common/pixel.c
+===================================================================
+--- common/pixel.c (revisione 634)
++++ common/pixel.c (copia locale)
+@@ -215,7 +215,17 @@
+ PIXEL_SATD_C( x264_pixel_satd_4x8, 4, 8 ) + PIXEL_SATD_C( x264_pixel_satd_4x4, 4, 4 ) + ++static int x264_pixel_count_8x8( uint8_t *pix1, int i_pix1, uint32_t threshold ) ++{ ++ int i, j, sum = 0; ++ ++ for ( i = 0; i < 8; ++i, pix1 += i_pix1 ) ++ for ( j = 0; j < 8; ++j ) ++ sum += pix1[j] > (uint8_t)threshold; + ++ return sum; ++} ++ + /**************************************************************************** + * pixel_sa8d_WxH: sum of 8x8 Hadamard transformed differences + ****************************************************************************/ +@@ -469,6 +479,8 @@
+ pixf->ads[PIXEL_16x16] = pixel_ads4; + pixf->ads[PIXEL_16x8] = pixel_ads2; + pixf->ads[PIXEL_8x8] = pixel_ads1; ++ ++ pixf->count_8x8 = x264_pixel_count_8x8; + + #ifdef HAVE_MMX + if( cpu&X264_CPU_MMX ) +Index: common/pixel.h
+===================================================================
+--- common/pixel.h (revisione 634)
++++ common/pixel.h (copia locale)
+@@ -26,6 +26,7 @@
+ + typedef int (*x264_pixel_cmp_t) ( uint8_t *, int, uint8_t *, int ); + typedef int (*x264_pixel_cmp_pde_t) ( uint8_t *, int, uint8_t *, int, int ); ++typedef int (*x264_pixel_count_t) ( uint8_t *, int, uint32_t ); + typedef void (*x264_pixel_cmp_x3_t) ( uint8_t *, uint8_t *, uint8_t *, uint8_t *, int, int[3] ); + typedef void (*x264_pixel_cmp_x4_t) ( uint8_t *, uint8_t *, uint8_t *, uint8_t *, uint8_t *, int, int[4] ); + +@@ -84,6 +85,7 @@
+ /* multiple parallel calls to sad. */ + x264_pixel_cmp_x3_t sad_x3[7]; + x264_pixel_cmp_x4_t sad_x4[7]; ++ x264_pixel_count_t count_8x8; + + /* abs-diff-sum for successive elimination. + * may round width up to a multiple of 8. */ +Index: common/common.c
+===================================================================
+--- common/common.c (revisione 634)
++++ common/common.c (copia locale)
+@@ -125,6 +125,9 @@
+ param->analyse.i_chroma_qp_offset = 0; + param->analyse.b_fast_pskip = 1; + param->analyse.b_dct_decimate = 1; ++ param->analyse.b_aq = 0; ++ param->analyse.f_aq_strength = 0.0; ++ param->analyse.f_aq_sensitivity = 15; + param->analyse.i_luma_deadzone[0] = 21; + param->analyse.i_luma_deadzone[1] = 11; + param->analyse.b_psnr = 1; +@@ -457,6 +460,13 @@
+ p->analyse.b_fast_pskip = atobool(value); + OPT("dct-decimate") + p->analyse.b_dct_decimate = atobool(value); ++ OPT("aq-strength") ++ { ++ p->analyse.f_aq_strength = atof(value); ++ p->analyse.b_aq = (p->analyse.f_aq_strength > 0.0); ++ } ++ OPT("aq-sensitivity") ++ p->analyse.f_aq_sensitivity = atof(value); + OPT("deadzone-inter") + p->analyse.i_luma_deadzone[0] = atoi(value); + OPT("deadzone-intra") +@@ -936,6 +946,9 @@
+ s += sprintf( s, " zones" ); + } + ++ if( p->analyse.b_aq ) ++ s += sprintf( s, " aq=1:%.1f:%.1f", p->analyse.f_aq_strength, p->analyse.f_aq_sensitivity ); ++ + return buf; + } + +Index: x264.h
+===================================================================
+--- x264.h (revisione 634)
++++ x264.h (copia locale)
+@@ -223,6 +223,9 @@
+ int i_trellis; /* trellis RD quantization */ + int b_fast_pskip; /* early SKIP detection on P-frames */ + int b_dct_decimate; /* transform coefficient thresholding on P-frames */ ++ int b_aq; /* psy adaptive QP */ ++ float f_aq_strength; ++ float f_aq_sensitivity; + int i_noise_reduction; /* adaptive pseudo-deadzone */ + + /* the deadzone size that will be used in luma quantization */ |