libhb: New denoiser, nlmeans.

Non-local means averages multiple patches of similar pixels together, preserving similarities and attenuating variance (usually noise). This is typically more effective than lowpass and more faithfully restores the appearance of structure and detail found in the original source, especially in the high frequency range. Parameters for origin patch weight tuning and pre-filtering further improve on the original algorithm. git-svn-id: svn://svn.handbrake.fr/HandBrake/trunk@6216 b64f7644-9d1e-0410-96f1-a4d463321fa5
author: bradleys <[email protected]> 2014-06-19 21:44:37 +0000
committer: bradleys <[email protected]> 2014-06-19 21:44:37 +0000
commit: 7fba1c6ad31aa1002624223ef34b612efa8262f4 (patch)
tree: ee459af7c2ab4ef7fe01e17a532bf5f6767f73cf /libhb
parent: 80a124ff2567ac45b26a606d425420a1ee590506 (diff)
4 files changed, 748 insertions, 0 deletions
diff --git a/libhb/common.c b/libhb/common.c
index 60b926d94..6ba81f762 100644
--- a/libhb/common.c
+++ b/libhb/common.c
@@ -3247,6 +3247,10 @@ hb_filter_object_t * hb_filter_init( int filter_id )
             filter = &hb_filter_denoise;
             break;
 
+        case HB_FILTER_NLMEANS:
+            filter = &hb_filter_nlmeans;
+            break;
+
         case HB_FILTER_RENDER_SUB:
             filter = &hb_filter_render_sub;
             break;
diff --git a/libhb/common.h b/libhb/common.h
index 778918db2..2a57b0534 100644
--- a/libhb/common.h
+++ b/libhb/common.h
@@ -1210,6 +1210,7 @@ enum
     // Filters that must operate on the original source image are next
     HB_FILTER_DEBLOCK,
     HB_FILTER_DENOISE,
+    HB_FILTER_NLMEANS,
     HB_FILTER_RENDER_SUB,
     HB_FILTER_CROP_SCALE,
 
diff --git a/libhb/internal.h b/libhb/internal.h
index e3b81cd0c..2f7cbacc1 100644
--- a/libhb/internal.h
+++ b/libhb/internal.h
@@ -433,6 +433,7 @@ extern hb_filter_object_t hb_filter_detelecine;
 extern hb_filter_object_t hb_filter_deinterlace;
 extern hb_filter_object_t hb_filter_deblock;
 extern hb_filter_object_t hb_filter_denoise;
+extern hb_filter_object_t hb_filter_nlmeans;
 extern hb_filter_object_t hb_filter_decomb;
 extern hb_filter_object_t hb_filter_rotate;
 extern hb_filter_object_t hb_filter_crop_scale;
diff --git a/libhb/nlmeans.c b/libhb/nlmeans.c
new file mode 100644
index 000000000..ad3f1d393
--- /dev/null
+++ b/libhb/nlmeans.c
@@ -0,0 +1,742 @@
+/* nlmeans.c
+
+   Copyright (c) 2013 Dirk Farin
+   Copyright (c) 2003-2014 HandBrake Team
+   This file is part of the HandBrake source code
+   Homepage: <http://handbrake.fr/>.
+   It may be used under the terms of the GNU General Public License v2.
+   For full terms see the file COPYING file or visit http://www.gnu.org/licenses/gpl-2.0.html
+ */
+
+/* Usage
+ *
+ * Parameters:
+ *     lumaY_strength   : lumaY_origin_tune   : lumaY_patch_size   : lumaY_range   : lumaY_frames   : lumaY_prefilter   :
+ *     chromaB_strength : chromaB_origin_tune : chromaB_patch_size : chromaB_range : chromaB_frames : chromaB_prefilter :
+ *     chromaR_strength : chromaR_origin_tune : chromaR_patch_size : chromaR_range : chromaR_frames : chromaR_prefilter
+ *
+ * Defaults:
+ *     8:1:7:3:2:0 for each channel (equivalent to 8:1:7:3:2:0:8:1:7:3:2:0:8:1:7:3:2:0)
+ *
+ * Parameters cascade, e.g. 6:0.8:7:3:3:0:4:1 sets:
+ *     strength 6, origin tune 0.8 for luma
+ *     patch size 7, range 3, frames 3, prefilter 0 for all channels
+ *     strength 4, origin tune 1 for both chroma channels
+ *
+ * Strength is relative and must be adjusted; ALL parameters affect overall strength.
+ * Lower origin tune improves results for noisier input or animation (film 0.5-1, animation 0.15-0.5).
+ * Large patch size (>9) may greatly reduce quality by clobbering detail.
+ * Larger search range increases quality; however, computation time increases exponentially.
+ * Large number of frames (film >3, animation >6) may cause temporal smearing.
+ * Prefiltering can potentially improve weight decisions, yielding better results for difficult sources.
+ *
+ * Prefilter enum combos:
+ *     1: Mean 3x3
+ *     2: Mean 5x5
+ *     3: Mean 5x5 (overrides Mean 3x3)
+ *   257: Mean 3x3 reduced by 25%
+ *   258: Mean 5x5 reduced by 25%
+ *   513: Mean 3x3 reduced by 50%
+ *   514: Mean 5x5 reduced by 50%
+ *   769: Mean 3x3 reduced by 75%
+ *   770: Mean 5x5 reduced by 75%
+ *  1025: Mean 3x3 plus edge boost (restores lost edge detail)
+ *  1026: Mean 5x5 plus edge boost
+ *  1281: Mean 3x3 reduced by 25% plus edge boost
+ *        etc...
+ *  2049: Mean 3x3 passthru (NL-means off, prefilter is the output)
+ *        etc...
+ *  3329: Mean 3x3 reduced by 25% plus edge boost, passthru
+ *        etc...
+ */
+
+#include "hb.h"
+#include "hbffmpeg.h"
+
+#define NLMEANS_STRENGTH_LUMA_DEFAULT      8
+#define NLMEANS_STRENGTH_CHROMA_DEFAULT    8
+#define NLMEANS_ORIGIN_TUNE_LUMA_DEFAULT   1
+#define NLMEANS_ORIGIN_TUNE_CHROMA_DEFAULT 1
+#define NLMEANS_PATCH_SIZE_LUMA_DEFAULT    7
+#define NLMEANS_PATCH_SIZE_CHROMA_DEFAULT  7
+#define NLMEANS_RANGE_LUMA_DEFAULT         3
+#define NLMEANS_RANGE_CHROMA_DEFAULT       3
+#define NLMEANS_FRAMES_LUMA_DEFAULT        2
+#define NLMEANS_FRAMES_CHROMA_DEFAULT      2
+#define NLMEANS_PREFILTER_LUMA_DEFAULT     0
+#define NLMEANS_PREFILTER_CHROMA_DEFAULT   0
+
+#define NLMEANS_PREFILTER_MODE_MEAN3X3       1
+#define NLMEANS_PREFILTER_MODE_MEAN5X5       2
+#define NLMEANS_PREFILTER_MODE_RESERVED4     4 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED8     8 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED16   16 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED32   32 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED64   64 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED128 128 // Reserved
+#define NLMEANS_PREFILTER_MODE_REDUCE25    256
+#define NLMEANS_PREFILTER_MODE_REDUCE50    512
+#define NLMEANS_PREFILTER_MODE_EDGEBOOST  1024
+#define NLMEANS_PREFILTER_MODE_PASSTHRU   2048
+
+#define NLMEANS_FRAMES_MAX 32
+#define NLMEANS_EXPSIZE    128
+
+typedef struct
+{
+    uint8_t *mem;
+    uint8_t *mem_pre;
+    uint8_t *image;
+    uint8_t *image_pre;
+    int w;
+    int h;
+    int border;
+} BorderedPlane;
+
+struct PixelSum
+{
+    float weight_sum;
+    float pixel_sum;
+};
+
+struct hb_filter_private_s
+{
+    double strength[3];    // averaging weight decay, larger produces smoother output
+    double origin_tune[3]; // weight tuning for origin patch, 0.00..1.00
+    int    patch_size[3];  // pixel context region width  (must be odd)
+    int    range[3];       // spatial search window width (must be odd)
+    int    frames[3];      // temporal search depth in frames
+    int    prefilter[3];   // prefilter mode, can improve weight analysis
+
+    BorderedPlane frame_tmp[3][32];
+    int           frame_ready[3][32];
+};
+
+static int hb_nlmeans_init(hb_filter_object_t *filter,
+                           hb_filter_init_t   *init);
+
+static int hb_nlmeans_work(hb_filter_object_t *filter,
+                           hb_buffer_t **buf_in,
+                           hb_buffer_t **buf_out);
+
+static void hb_nlmeans_close(hb_filter_object_t *filter);
+
+hb_filter_object_t hb_filter_nlmeans =
+{
+    .id            = HB_FILTER_NLMEANS,
+    .enforce_order = 1,
+    .name          = "Denoise (nlmeans)",
+    .settings      = NULL,
+    .init          = hb_nlmeans_init,
+    .work          = hb_nlmeans_work,
+    .close         = hb_nlmeans_close,
+};
+
+static void nlmeans_border(uint8_t *src,
+                           int w,
+                           int h,
+                           int border)
+{
+
+    uint8_t *image = src + border + w*border;
+    int iw = w - 2*border;
+    int ih = h - 2*border;
+
+    // Create faux borders using edge pixels
+    for (int y = 0; y < ih; y++)
+    {
+        for (int x = 0; x < border; x++)
+        {
+            *(image + y*w - x - 1)  = *(image + y*w + x);
+            *(image + y*w + x + iw) = *(image + y*w - x + (iw-1));
+        }
+    }
+    for (int y = 0; y < border; y++)
+    {
+        memcpy(image - border -  (y+1)*w, image - border +        y*w, w);
+        memcpy(image - border + (y+ih)*w, image - border + (ih-y-1)*w, w);
+    }
+
+}
+
+static void nlmeans_deborder(uint8_t *src,
+                             uint8_t *dst,
+                             int w,
+                             int h,
+                             int border)
+{
+
+    uint8_t *image = src + border + w*border;
+    int iw = w - 2*border;
+    int ih = h - 2*border;
+
+    // Copy main image
+    for (int y = 0; y < ih; y++)
+    {
+        memcpy(dst + y*iw, image + y*w, iw);
+    }
+
+}
+
+static void nlmeans_alloc(uint8_t *src,
+                          int src_w,
+                          int src_h,
+                          BorderedPlane *dst,
+                          int dst_w,
+                          int dst_h,
+                          int border)
+{
+
+    uint8_t *mem   = malloc(dst_w * dst_h * sizeof(uint8_t));
+    uint8_t *image = mem + border + dst_w*border;
+
+    // Copy main image
+    for (int y = 0; y < src_h; y++)
+    {
+        memcpy(image + y*dst_w, src + y*src_w, src_w);
+    }
+
+    dst->mem       = mem;
+    dst->image     = image;
+    dst->w         = dst_w;
+    dst->h         = dst_h;
+    dst->border    = border;
+
+    nlmeans_border(dst->mem, dst->w, dst->h, dst->border);
+    dst->mem_pre   = dst->mem;
+    dst->image_pre = dst->image;
+
+}
+
+static void nlmeans_filter_mean(uint8_t *src,
+                                uint8_t *dst,
+                                int w,
+                                int h,
+                                int border,
+                                int size)
+{
+
+    // Mean filter
+    int iw = w - 2*border;
+    int ih = h - 2*border;
+    int offset_min = -((size - 1) /2);
+    int offset_max =   (size + 1) /2;
+    uint16_t pixel_sum;
+    double pixel_weight = 1.0 / (size * size);
+    for (int y = 0; y < ih; y++)
+    {
+        for (int x = 0; x < iw; x++)
+        {
+            pixel_sum = 0;
+            for (int k = offset_min; k < offset_max; k++)
+            {
+                for (int j = offset_min; j < offset_max; j++)
+                {
+                    pixel_sum = pixel_sum + *(src + w*(y+j) + (x+k));
+                }
+            }
+            *(dst + w*y + x) = (uint8_t)(pixel_sum * pixel_weight);
+        }
+    }
+
+}
+
+static void nlmeans_filter_edgeboost(uint8_t *src,
+                                     uint8_t *dst,
+                                     int w,
+                                     int h,
+                                     int border)
+{
+
+    int iw = w - 2*border;
+    int ih = h - 2*border;
+
+    // Custom kernel
+    int kernel_size = 3;
+    int kernel[3][3] = {{-31, 0, 31},
+                        {-44, 0, 44},
+                        {-31, 0, 31}};
+    double kernel_coef = 1.0 / 27.0;
+
+    // Detect edges
+    int offset_min = -((kernel_size - 1) /2);
+    int offset_max =   (kernel_size + 1) /2;
+    uint16_t pixel1;
+    uint16_t pixel2;
+    uint8_t *mask = malloc(iw * ih * sizeof(uint8_t));
+    for (int y = 0; y < ih; y++)
+    {
+        for (int x = 0; x < iw; x++)
+        {
+            pixel1 = 0;
+            pixel2 = 0;
+            for (int k = offset_min; k < offset_max; k++)
+            {
+                for (int j = offset_min; j < offset_max; j++)
+                {
+                    pixel1 += kernel[j+1][k+1] * *(src + w*(y+j) + (x+k));
+                    pixel2 += kernel[k+1][j+1] * *(src + w*(y+j) + (x+k));
+                }
+            }
+            pixel1 = pixel1 > 0 ? pixel1 : -pixel1;
+            pixel2 = pixel2 > 0 ? pixel2 : -pixel2;
+            pixel1 = (uint16_t)(((double)pixel1 * kernel_coef) + 128);
+            pixel2 = (uint16_t)(((double)pixel2 * kernel_coef) + 128);
+            *(mask + iw*y + x) = (uint8_t)(pixel1 + pixel2);
+            if (*(mask + iw*y + x) > 160)
+            {
+                *(dst + w*y + x) = (3 * *(src + w*y + x) + 1 * *(dst + w*y + x)) /4;
+                //*(dst + w*y + x) = 235;
+            }
+            else if (*(mask + iw*y + x) > 88)
+            {
+                *(dst + w*y + x) = (2 * *(src + w*y + x) + 3 * *(dst + w*y + x)) /5;
+                //*(dst + w*y + x) = 128;
+            }
+            else
+            {
+                //*(dst + w*y + x) = 16;
+            }
+        }
+    }
+
+    free(mask);
+
+}
+
+static void nlmeans_prefilter(BorderedPlane *src,
+                              int filter_type)
+{
+
+    if (filter_type & NLMEANS_PREFILTER_MODE_MEAN3X3 ||
+        filter_type & NLMEANS_PREFILTER_MODE_MEAN5X5)
+    {
+
+        // Source image
+        uint8_t *mem   = src->mem;
+        uint8_t *image = src->image;
+        int w          = src->w;
+        int h          = src->h;
+        int border     = src->border;
+
+        // Duplicate plane
+        uint8_t *mem_pre = malloc(w * h * sizeof(uint8_t));
+        uint8_t *image_pre = mem_pre + border + w*border;
+        for (int y = 0; y < h; y++)
+        {
+            memcpy(mem_pre + y*w, mem + y*w, w);
+        }
+
+        // Filter plane; should already have at least 2px extra border on each side
+        if (filter_type & NLMEANS_PREFILTER_MODE_MEAN5X5)
+        {
+            // Mean 5x5
+            nlmeans_filter_mean(image, image_pre, w, h, border, 5);
+        }
+        else if (filter_type & NLMEANS_PREFILTER_MODE_MEAN3X3)
+        {
+            // Mean 3x3
+            nlmeans_filter_mean(image, image_pre, w, h, border, 3);
+        }
+
+        // Restore edges
+        if (filter_type & NLMEANS_PREFILTER_MODE_EDGEBOOST)
+        {
+            nlmeans_filter_edgeboost(image, image_pre, w, h, border);
+        }
+
+        // Blend source and destination for lesser effect
+        int wet = 1;
+        int dry = 0;
+        if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE50 &&
+            filter_type & NLMEANS_PREFILTER_MODE_REDUCE25)
+        {
+            wet = 1;
+            dry = 3;
+        }
+        else if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE50)
+        {
+            wet = 1;
+            dry = 1;
+        }
+        else if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE25)
+        {
+            wet = 3;
+            dry = 1;
+        }
+        if (dry > 0)
+        {
+            for (int y = 0; y < h; y++)
+            {
+                for (int x = 0; x < w; x++)
+                {
+                    *(mem_pre + w*y + x) = (uint8_t)((wet * *(mem_pre + w*y + x) + dry * *(mem + w*y + x)) / (wet + dry));
+                }
+            }
+        }
+
+        // Assign result
+        src->mem_pre   = mem_pre;
+        src->image_pre = image_pre;
+
+        // Recreate borders
+        nlmeans_border(mem_pre, w, h, border);
+
+    }
+
+}
+
+static void nlmeans_plane(BorderedPlane *plane_tmp,
+                          int *plane_ready,
+                          uint8_t *dst,
+                          int w,
+                          int h,
+                          double h_param,
+                          double origin_tune,
+                          int n,
+                          int r)
+{
+
+    int n_half = (n-1) /2;
+    int r_half = (r-1) /2;
+
+    // Source image
+    uint8_t *src     = plane_tmp[0].image;
+    uint8_t *src_pre = plane_tmp[0].image_pre;
+    int src_w        = plane_tmp[0].w;
+
+    // Allocate temporary pixel sums
+    struct PixelSum *tmp_data = calloc(w * h, sizeof(struct PixelSum));
+
+    // Allocate integral image
+    int integral_stride = w + 2*16;
+    uint32_t *integral_mem = malloc(integral_stride * (h+1) * sizeof(uint32_t));
+    uint32_t *integral     = integral_mem + integral_stride + 16;
+
+    // Precompute exponential table
+    float exptable[NLMEANS_EXPSIZE];
+    const float weight_factor       = 1.0/n/n / (h_param * h_param);
+    const float min_weight_in_table = 0.0005;
+    const float stretch             = NLMEANS_EXPSIZE / (-log(min_weight_in_table));
+    const float weight_fact_table   = weight_factor * stretch;
+    const int   diff_max            = NLMEANS_EXPSIZE / weight_fact_table;
+    for (int i = 0; i < NLMEANS_EXPSIZE; i++)
+    {
+        exptable[i] = exp(-i/stretch);
+    }
+    exptable[NLMEANS_EXPSIZE-1] = 0;
+
+    // Iterate through available frames
+    for (int plane_index = 0; plane_ready[plane_index] == 1; plane_index++)
+    {
+
+        // Compare image
+        uint8_t *compare     = plane_tmp[plane_index].image;
+        uint8_t *compare_pre = plane_tmp[plane_index].image_pre;
+        int compare_w        = plane_tmp[plane_index].w;
+
+        // Iterate through all displacements
+        for (int dy = -r_half; dy <= r_half; dy++)
+        {
+            for (int dx = -r_half; dx <= r_half; dx++)
+            {
+
+                // Apply special weight tuning to origin patch
+                if (dx == 0 && dy == 0 && plane_index == 0)
+                {
+                    // TODO: Parallelize this
+                    for (int y = n_half; y < h-n + n_half; y++)
+                    {
+                        for (int x = n_half; x < w-n + n_half; x++)
+                        {
+                            tmp_data[y*w + x].weight_sum += origin_tune;
+                            tmp_data[y*w + x].pixel_sum  += origin_tune * src[y*src_w + x];
+                        }
+                    }
+                    continue;
+                }
+
+                // Build integral
+                memset(integral-1 - integral_stride, 0, (w+1) * sizeof(uint32_t));
+                for (int y = 0; y < h; y++)
+                {
+                    const uint8_t *p1 = src_pre + y*src_w;
+                    const uint8_t *p2 = compare_pre + (y+dy)*compare_w + dx;
+                    uint32_t *out = integral + (y*integral_stride) - 1;
+
+                    *out++ = 0;
+
+                    for (int x = 0; x < w; x++)
+                    {
+                        int diff = *p1++ - *p2++;
+                        *out = *(out-1) + diff * diff;
+                        out++;
+                    }
+
+                    if (y > 0)
+                    {
+                        out = integral + y*integral_stride;
+
+                        for (int x = 0; x < w; x++)
+                        {
+                            *out += *(out - integral_stride);
+                            out++;
+                        }
+                    }
+                }
+
+                // Average displacement
+                // TODO: Parallelize this
+                for (int y = 0; y <= h-n; y++)
+                {
+                    const uint32_t *integral_ptr1 = integral + (y  -1)*integral_stride - 1;
+                    const uint32_t *integral_ptr2 = integral + (y+n-1)*integral_stride - 1;
+
+                    for (int x = 0; x <= w-n; x++)
+                    {
+                        int xc = x + n_half;
+                        int yc = y + n_half;
+
+                        // Difference between patches
+                        int diff = (uint32_t)(integral_ptr2[n] - integral_ptr2[0] - integral_ptr1[n] + integral_ptr1[0]);
+
+                        // Sum pixel with weight
+                        if (diff < diff_max)
+                        {
+                            int diffidx = diff * weight_fact_table;
+
+                            //float weight = exp(-diff*weightFact);
+                            float weight = exptable[diffidx];
+
+                            tmp_data[yc*w + xc].weight_sum += weight;
+                            tmp_data[yc*w + xc].pixel_sum  += weight * compare[(yc+dy)*compare_w + xc + dx];
+                        }
+
+                        integral_ptr1++;
+                        integral_ptr2++;
+                    }
+                }
+            }
+        }
+    }
+
+    // Copy edges
+    for (int y = 0; y < h; y++)
+    {
+        for (int x = 0; x < n_half; x++)
+        {
+            *(dst + y*w + x)         = *(src + y*src_w - x - 1);
+            *(dst + y*w - x + (w-1)) = *(src + y*src_w + x + w);
+        }
+    }
+    for (int y = 0; y < n_half; y++)
+    {
+        memcpy(dst +       y*w, src - (y+1)*src_w, w);
+        memcpy(dst + (h-y-1)*w, src + (y+h)*src_w, w);
+    }
+
+    // Copy main image
+    uint8_t result;
+    for (int y = n_half; y < h-n_half; y++)
+    {
+        for (int x = n_half; x < w-n_half; x++)
+        {
+            result = (uint8_t)(tmp_data[y*w + x].pixel_sum / tmp_data[y*w + x].weight_sum);
+            *(dst + y*w + x) = result ? result : *(src + y*src_w + x);
+        }
+    }
+
+    free(tmp_data);
+    free(integral_mem);
+
+}
+
+static int hb_nlmeans_init(hb_filter_object_t *filter,
+                           hb_filter_init_t *init)
+{
+    filter->private_data = calloc(sizeof(struct hb_filter_private_s), 1);
+    hb_filter_private_t *pv = filter->private_data;
+
+    // Mark parameters unset
+    for (int c = 0; c < 3; c++)
+    {
+        pv->strength[c]    = -1;
+        pv->origin_tune[c] = -1;
+        pv->patch_size[c]  = -1;
+        pv->range[c]       = -1;
+        pv->frames[c]      = -1;
+        pv->prefilter[c]   = -1;
+    }
+
+    // Read user parameters
+    if (filter->settings != NULL)
+    {
+        sscanf(filter->settings, "%lf:%lf:%d:%d:%d:%d:%lf:%lf:%d:%d:%d:%d:%lf:%lf:%d:%d:%d:%d",
+               &pv->strength[0], &pv->origin_tune[0], &pv->patch_size[0], &pv->range[0], &pv->frames[0], &pv->prefilter[0],
+               &pv->strength[1], &pv->origin_tune[1], &pv->patch_size[1], &pv->range[1], &pv->frames[1], &pv->prefilter[1],
+               &pv->strength[2], &pv->origin_tune[2], &pv->patch_size[2], &pv->range[2], &pv->frames[2], &pv->prefilter[2]);
+    }
+
+    // Cascade values
+    // Cr not set; inherit Cb. Cb not set; inherit Y. Y not set; defaults.
+    for (int c = 1; c < 3; c++)
+    {
+        if (pv->strength[c]    == -1) { pv->strength[c]    = pv->strength[c-1]; }
+        if (pv->origin_tune[c] == -1) { pv->origin_tune[c] = pv->origin_tune[c-1]; }
+        if (pv->patch_size[c]  == -1) { pv->patch_size[c]  = pv->patch_size[c-1]; }
+        if (pv->range[c]       == -1) { pv->range[c]       = pv->range[c-1]; }
+        if (pv->frames[c]      == -1) { pv->frames[c]      = pv->frames[c-1]; }
+        if (pv->prefilter[c]   == -1) { pv->prefilter[c]   = pv->prefilter[c-1]; }
+    }
+
+    for (int c = 0; c < 3; c++)
+    {
+        // Replace unset values with defaults
+        if (pv->strength[c]    == -1) { pv->strength[c]    = c ? NLMEANS_STRENGTH_LUMA_DEFAULT    : NLMEANS_STRENGTH_CHROMA_DEFAULT; }
+        if (pv->origin_tune[c] == -1) { pv->origin_tune[c] = c ? NLMEANS_ORIGIN_TUNE_LUMA_DEFAULT : NLMEANS_ORIGIN_TUNE_CHROMA_DEFAULT; }
+        if (pv->patch_size[c]  == -1) { pv->patch_size[c]  = c ? NLMEANS_PATCH_SIZE_LUMA_DEFAULT  : NLMEANS_PATCH_SIZE_CHROMA_DEFAULT; }
+        if (pv->range[c]       == -1) { pv->range[c]       = c ? NLMEANS_RANGE_LUMA_DEFAULT       : NLMEANS_RANGE_CHROMA_DEFAULT; }
+        if (pv->frames[c]      == -1) { pv->frames[c]      = c ? NLMEANS_FRAMES_LUMA_DEFAULT      : NLMEANS_FRAMES_CHROMA_DEFAULT; }
+        if (pv->prefilter[c]   == -1) { pv->prefilter[c]   = c ? NLMEANS_PREFILTER_LUMA_DEFAULT   : NLMEANS_PREFILTER_CHROMA_DEFAULT; }
+
+        // Sanitize
+        if (pv->strength[c] < 0)        { pv->strength[c] = 0; }
+        if (pv->origin_tune[c] < 0.01)  { pv->origin_tune[c] = 0.01; } // avoid black artifacts
+        if (pv->origin_tune[c] > 1)     { pv->origin_tune[c] = 1; }
+        if (pv->patch_size[c] % 2 == 0) { pv->patch_size[c]--; }
+        if (pv->patch_size[c] < 1)      { pv->patch_size[c] = 1; }
+        if (pv->range[c] % 2 == 0)      { pv->range[c]--; }
+        if (pv->range[c] < 1)           { pv->range[c] = 1; }
+        if (pv->frames[c] < 1)          { pv->frames[c] = 1; }
+        if (pv->frames[c] > NLMEANS_FRAMES_MAX) { pv->frames[c] = NLMEANS_FRAMES_MAX; }
+        if (pv->prefilter[c] < 0)       { pv->prefilter[c] = 0; }
+
+        // Mark buffer empty
+        for (int f = 0; f < NLMEANS_FRAMES_MAX; f++)
+        {
+            pv->frame_ready[c][f] = 0;
+        }
+    }
+
+    return 0;
+}
+
+static void hb_nlmeans_close(hb_filter_object_t *filter)
+{
+    hb_filter_private_t *pv = filter->private_data;
+
+    if (pv == NULL)
+    {
+        return;
+    }
+
+    for (int c = 0; c < 3; c++)
+    {
+        for (int f = 0; f < pv->frames[c]; f++)
+        {
+            if (pv->frame_tmp[c][f].mem_pre != NULL &&
+                pv->frame_tmp[c][f].mem_pre != pv->frame_tmp[c][f].mem)
+            {
+                free(pv->frame_tmp[c][f].mem_pre);
+                pv->frame_tmp[c][f].mem_pre = NULL;
+            }
+            if (pv->frame_tmp[c][f].mem != NULL)
+            {
+                free(pv->frame_tmp[c][f].mem);
+                pv->frame_tmp[c][f].mem = NULL;
+            }
+        }
+    }
+
+    free(pv);
+    filter->private_data = NULL;
+}
+
+static int hb_nlmeans_work(hb_filter_object_t *filter,
+                           hb_buffer_t **buf_in,
+                           hb_buffer_t **buf_out )
+{
+    hb_filter_private_t *pv = filter->private_data;
+    hb_buffer_t *in = *buf_in, *out;
+
+    if (in->size <= 0)
+    {
+        *buf_out = in;
+        *buf_in  = NULL;
+        return HB_FILTER_DONE;
+    }
+
+    out = hb_video_buffer_init(in->f.width, in->f.height);
+
+    for (int c = 0; c < 3; c++)
+    {
+
+        if (pv->strength[c] == 0)
+        {
+            out->plane[c].data = in->plane[c].data;
+            continue;
+        }
+
+        int frames = pv->frames[c];
+
+        // Release last frame in buffer
+        if (pv->frame_tmp[c][frames-1].mem_pre != NULL &&
+            pv->frame_tmp[c][frames-1].mem_pre != pv->frame_tmp[c][frames-1].mem)
+        {
+            free(pv->frame_tmp[c][frames-1].mem_pre);
+            pv->frame_tmp[c][frames-1].mem_pre = NULL;
+        }
+        if (pv->frame_tmp[c][frames-1].mem != NULL)
+        {
+            free(pv->frame_tmp[c][frames-1].mem);
+            pv->frame_tmp[c][frames-1].mem = NULL;
+        }
+        pv->frame_ready[c][frames-1] = 0;
+
+        // Shift frames in buffer down one level
+        for (int f = frames-1; f > 0; f--)
+        {
+            pv->frame_tmp[c][f]   = pv->frame_tmp[c][f-1];
+            pv->frame_ready[c][f] = pv->frame_ready[c][f-1];
+        }
+
+        // Extend copy of plane with extra border and place in buffer
+        int border = ((pv->range[c] + 2) / 2 + 15) /16*16;
+        int w = in->plane[c].stride + 2*border;
+        int h = in->plane[c].height + 2*border;
+        nlmeans_alloc(in->plane[c].data,
+                      in->plane[c].stride,
+                      in->plane[c].height,
+                      &pv->frame_tmp[c][0],
+                      w,
+                      h,
+                      border);
+        nlmeans_prefilter(&pv->frame_tmp[c][0], pv->prefilter[c]);
+        pv->frame_ready[c][0] = 1;
+
+        if (pv->prefilter[c] & NLMEANS_PREFILTER_MODE_PASSTHRU)
+        {
+            nlmeans_deborder(pv->frame_tmp[c][0].mem_pre, out->plane[c].data, w, h, border);
+            continue;
+        }
+
+        // Process current plane
+        nlmeans_plane(pv->frame_tmp[c],
+                      pv->frame_ready[c],
+                      out->plane[c].data,
+                      in->plane[c].stride,
+                      in->plane[c].height,
+                      pv->strength[c],
+                      pv->origin_tune[c],
+                      pv->patch_size[c],
+                      pv->range[c]);
+
+    }
+
+    out->s = in->s;
+    hb_buffer_move_subs(out, in);
+
+    *buf_out = out;
+
+    return HB_FILTER_OK;
+}
author	bradleys <[email protected]>	2014-06-19 21:44:37 +0000
committer	bradleys <[email protected]>	2014-06-19 21:44:37 +0000
commit	7fba1c6ad31aa1002624223ef34b612efa8262f4 (patch)
tree	ee459af7c2ab4ef7fe01e17a532bf5f6767f73cf /libhb
parent	80a124ff2567ac45b26a606d425420a1ee590506 (diff)