summaryrefslogtreecommitdiffstats
path: root/libhb
diff options
context:
space:
mode:
Diffstat (limited to 'libhb')
-rw-r--r--libhb/common.c4
-rw-r--r--libhb/common.h1
-rw-r--r--libhb/internal.h1
-rw-r--r--libhb/nlmeans.c742
4 files changed, 748 insertions, 0 deletions
diff --git a/libhb/common.c b/libhb/common.c
index 60b926d94..6ba81f762 100644
--- a/libhb/common.c
+++ b/libhb/common.c
@@ -3247,6 +3247,10 @@ hb_filter_object_t * hb_filter_init( int filter_id )
filter = &hb_filter_denoise;
break;
+ case HB_FILTER_NLMEANS:
+ filter = &hb_filter_nlmeans;
+ break;
+
case HB_FILTER_RENDER_SUB:
filter = &hb_filter_render_sub;
break;
diff --git a/libhb/common.h b/libhb/common.h
index 778918db2..2a57b0534 100644
--- a/libhb/common.h
+++ b/libhb/common.h
@@ -1210,6 +1210,7 @@ enum
// Filters that must operate on the original source image are next
HB_FILTER_DEBLOCK,
HB_FILTER_DENOISE,
+ HB_FILTER_NLMEANS,
HB_FILTER_RENDER_SUB,
HB_FILTER_CROP_SCALE,
diff --git a/libhb/internal.h b/libhb/internal.h
index e3b81cd0c..2f7cbacc1 100644
--- a/libhb/internal.h
+++ b/libhb/internal.h
@@ -433,6 +433,7 @@ extern hb_filter_object_t hb_filter_detelecine;
extern hb_filter_object_t hb_filter_deinterlace;
extern hb_filter_object_t hb_filter_deblock;
extern hb_filter_object_t hb_filter_denoise;
+extern hb_filter_object_t hb_filter_nlmeans;
extern hb_filter_object_t hb_filter_decomb;
extern hb_filter_object_t hb_filter_rotate;
extern hb_filter_object_t hb_filter_crop_scale;
diff --git a/libhb/nlmeans.c b/libhb/nlmeans.c
new file mode 100644
index 000000000..ad3f1d393
--- /dev/null
+++ b/libhb/nlmeans.c
@@ -0,0 +1,742 @@
+/* nlmeans.c
+
+ Copyright (c) 2013 Dirk Farin
+ Copyright (c) 2003-2014 HandBrake Team
+ This file is part of the HandBrake source code
+ Homepage: <http://handbrake.fr/>.
+ It may be used under the terms of the GNU General Public License v2.
+ For full terms see the file COPYING file or visit http://www.gnu.org/licenses/gpl-2.0.html
+ */
+
+/* Usage
+ *
+ * Parameters:
+ * lumaY_strength : lumaY_origin_tune : lumaY_patch_size : lumaY_range : lumaY_frames : lumaY_prefilter :
+ * chromaB_strength : chromaB_origin_tune : chromaB_patch_size : chromaB_range : chromaB_frames : chromaB_prefilter :
+ * chromaR_strength : chromaR_origin_tune : chromaR_patch_size : chromaR_range : chromaR_frames : chromaR_prefilter
+ *
+ * Defaults:
+ * 8:1:7:3:2:0 for each channel (equivalent to 8:1:7:3:2:0:8:1:7:3:2:0:8:1:7:3:2:0)
+ *
+ * Parameters cascade, e.g. 6:0.8:7:3:3:0:4:1 sets:
+ * strength 6, origin tune 0.8 for luma
+ * patch size 7, range 3, frames 3, prefilter 0 for all channels
+ * strength 4, origin tune 1 for both chroma channels
+ *
+ * Strength is relative and must be adjusted; ALL parameters affect overall strength.
+ * Lower origin tune improves results for noisier input or animation (film 0.5-1, animation 0.15-0.5).
+ * Large patch size (>9) may greatly reduce quality by clobbering detail.
+ * Larger search range increases quality; however, computation time increases exponentially.
+ * Large number of frames (film >3, animation >6) may cause temporal smearing.
+ * Prefiltering can potentially improve weight decisions, yielding better results for difficult sources.
+ *
+ * Prefilter enum combos:
+ * 1: Mean 3x3
+ * 2: Mean 5x5
+ * 3: Mean 5x5 (overrides Mean 3x3)
+ * 257: Mean 3x3 reduced by 25%
+ * 258: Mean 5x5 reduced by 25%
+ * 513: Mean 3x3 reduced by 50%
+ * 514: Mean 5x5 reduced by 50%
+ * 769: Mean 3x3 reduced by 75%
+ * 770: Mean 5x5 reduced by 75%
+ * 1025: Mean 3x3 plus edge boost (restores lost edge detail)
+ * 1026: Mean 5x5 plus edge boost
+ * 1281: Mean 3x3 reduced by 25% plus edge boost
+ * etc...
+ * 2049: Mean 3x3 passthru (NL-means off, prefilter is the output)
+ * etc...
+ * 3329: Mean 3x3 reduced by 25% plus edge boost, passthru
+ * etc...
+ */
+
+#include "hb.h"
+#include "hbffmpeg.h"
+
+#define NLMEANS_STRENGTH_LUMA_DEFAULT 8
+#define NLMEANS_STRENGTH_CHROMA_DEFAULT 8
+#define NLMEANS_ORIGIN_TUNE_LUMA_DEFAULT 1
+#define NLMEANS_ORIGIN_TUNE_CHROMA_DEFAULT 1
+#define NLMEANS_PATCH_SIZE_LUMA_DEFAULT 7
+#define NLMEANS_PATCH_SIZE_CHROMA_DEFAULT 7
+#define NLMEANS_RANGE_LUMA_DEFAULT 3
+#define NLMEANS_RANGE_CHROMA_DEFAULT 3
+#define NLMEANS_FRAMES_LUMA_DEFAULT 2
+#define NLMEANS_FRAMES_CHROMA_DEFAULT 2
+#define NLMEANS_PREFILTER_LUMA_DEFAULT 0
+#define NLMEANS_PREFILTER_CHROMA_DEFAULT 0
+
+#define NLMEANS_PREFILTER_MODE_MEAN3X3 1
+#define NLMEANS_PREFILTER_MODE_MEAN5X5 2
+#define NLMEANS_PREFILTER_MODE_RESERVED4 4 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED8 8 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED16 16 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED32 32 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED64 64 // Reserved
+#define NLMEANS_PREFILTER_MODE_RESERVED128 128 // Reserved
+#define NLMEANS_PREFILTER_MODE_REDUCE25 256
+#define NLMEANS_PREFILTER_MODE_REDUCE50 512
+#define NLMEANS_PREFILTER_MODE_EDGEBOOST 1024
+#define NLMEANS_PREFILTER_MODE_PASSTHRU 2048
+
+#define NLMEANS_FRAMES_MAX 32
+#define NLMEANS_EXPSIZE 128
+
+typedef struct
+{
+ uint8_t *mem;
+ uint8_t *mem_pre;
+ uint8_t *image;
+ uint8_t *image_pre;
+ int w;
+ int h;
+ int border;
+} BorderedPlane;
+
+struct PixelSum
+{
+ float weight_sum;
+ float pixel_sum;
+};
+
+struct hb_filter_private_s
+{
+ double strength[3]; // averaging weight decay, larger produces smoother output
+ double origin_tune[3]; // weight tuning for origin patch, 0.00..1.00
+ int patch_size[3]; // pixel context region width (must be odd)
+ int range[3]; // spatial search window width (must be odd)
+ int frames[3]; // temporal search depth in frames
+ int prefilter[3]; // prefilter mode, can improve weight analysis
+
+ BorderedPlane frame_tmp[3][32];
+ int frame_ready[3][32];
+};
+
+static int hb_nlmeans_init(hb_filter_object_t *filter,
+ hb_filter_init_t *init);
+
+static int hb_nlmeans_work(hb_filter_object_t *filter,
+ hb_buffer_t **buf_in,
+ hb_buffer_t **buf_out);
+
+static void hb_nlmeans_close(hb_filter_object_t *filter);
+
+hb_filter_object_t hb_filter_nlmeans =
+{
+ .id = HB_FILTER_NLMEANS,
+ .enforce_order = 1,
+ .name = "Denoise (nlmeans)",
+ .settings = NULL,
+ .init = hb_nlmeans_init,
+ .work = hb_nlmeans_work,
+ .close = hb_nlmeans_close,
+};
+
+static void nlmeans_border(uint8_t *src,
+ int w,
+ int h,
+ int border)
+{
+
+ uint8_t *image = src + border + w*border;
+ int iw = w - 2*border;
+ int ih = h - 2*border;
+
+ // Create faux borders using edge pixels
+ for (int y = 0; y < ih; y++)
+ {
+ for (int x = 0; x < border; x++)
+ {
+ *(image + y*w - x - 1) = *(image + y*w + x);
+ *(image + y*w + x + iw) = *(image + y*w - x + (iw-1));
+ }
+ }
+ for (int y = 0; y < border; y++)
+ {
+ memcpy(image - border - (y+1)*w, image - border + y*w, w);
+ memcpy(image - border + (y+ih)*w, image - border + (ih-y-1)*w, w);
+ }
+
+}
+
+static void nlmeans_deborder(uint8_t *src,
+ uint8_t *dst,
+ int w,
+ int h,
+ int border)
+{
+
+ uint8_t *image = src + border + w*border;
+ int iw = w - 2*border;
+ int ih = h - 2*border;
+
+ // Copy main image
+ for (int y = 0; y < ih; y++)
+ {
+ memcpy(dst + y*iw, image + y*w, iw);
+ }
+
+}
+
+static void nlmeans_alloc(uint8_t *src,
+ int src_w,
+ int src_h,
+ BorderedPlane *dst,
+ int dst_w,
+ int dst_h,
+ int border)
+{
+
+ uint8_t *mem = malloc(dst_w * dst_h * sizeof(uint8_t));
+ uint8_t *image = mem + border + dst_w*border;
+
+ // Copy main image
+ for (int y = 0; y < src_h; y++)
+ {
+ memcpy(image + y*dst_w, src + y*src_w, src_w);
+ }
+
+ dst->mem = mem;
+ dst->image = image;
+ dst->w = dst_w;
+ dst->h = dst_h;
+ dst->border = border;
+
+ nlmeans_border(dst->mem, dst->w, dst->h, dst->border);
+ dst->mem_pre = dst->mem;
+ dst->image_pre = dst->image;
+
+}
+
+static void nlmeans_filter_mean(uint8_t *src,
+ uint8_t *dst,
+ int w,
+ int h,
+ int border,
+ int size)
+{
+
+ // Mean filter
+ int iw = w - 2*border;
+ int ih = h - 2*border;
+ int offset_min = -((size - 1) /2);
+ int offset_max = (size + 1) /2;
+ uint16_t pixel_sum;
+ double pixel_weight = 1.0 / (size * size);
+ for (int y = 0; y < ih; y++)
+ {
+ for (int x = 0; x < iw; x++)
+ {
+ pixel_sum = 0;
+ for (int k = offset_min; k < offset_max; k++)
+ {
+ for (int j = offset_min; j < offset_max; j++)
+ {
+ pixel_sum = pixel_sum + *(src + w*(y+j) + (x+k));
+ }
+ }
+ *(dst + w*y + x) = (uint8_t)(pixel_sum * pixel_weight);
+ }
+ }
+
+}
+
+static void nlmeans_filter_edgeboost(uint8_t *src,
+ uint8_t *dst,
+ int w,
+ int h,
+ int border)
+{
+
+ int iw = w - 2*border;
+ int ih = h - 2*border;
+
+ // Custom kernel
+ int kernel_size = 3;
+ int kernel[3][3] = {{-31, 0, 31},
+ {-44, 0, 44},
+ {-31, 0, 31}};
+ double kernel_coef = 1.0 / 27.0;
+
+ // Detect edges
+ int offset_min = -((kernel_size - 1) /2);
+ int offset_max = (kernel_size + 1) /2;
+ uint16_t pixel1;
+ uint16_t pixel2;
+ uint8_t *mask = malloc(iw * ih * sizeof(uint8_t));
+ for (int y = 0; y < ih; y++)
+ {
+ for (int x = 0; x < iw; x++)
+ {
+ pixel1 = 0;
+ pixel2 = 0;
+ for (int k = offset_min; k < offset_max; k++)
+ {
+ for (int j = offset_min; j < offset_max; j++)
+ {
+ pixel1 += kernel[j+1][k+1] * *(src + w*(y+j) + (x+k));
+ pixel2 += kernel[k+1][j+1] * *(src + w*(y+j) + (x+k));
+ }
+ }
+ pixel1 = pixel1 > 0 ? pixel1 : -pixel1;
+ pixel2 = pixel2 > 0 ? pixel2 : -pixel2;
+ pixel1 = (uint16_t)(((double)pixel1 * kernel_coef) + 128);
+ pixel2 = (uint16_t)(((double)pixel2 * kernel_coef) + 128);
+ *(mask + iw*y + x) = (uint8_t)(pixel1 + pixel2);
+ if (*(mask + iw*y + x) > 160)
+ {
+ *(dst + w*y + x) = (3 * *(src + w*y + x) + 1 * *(dst + w*y + x)) /4;
+ //*(dst + w*y + x) = 235;
+ }
+ else if (*(mask + iw*y + x) > 88)
+ {
+ *(dst + w*y + x) = (2 * *(src + w*y + x) + 3 * *(dst + w*y + x)) /5;
+ //*(dst + w*y + x) = 128;
+ }
+ else
+ {
+ //*(dst + w*y + x) = 16;
+ }
+ }
+ }
+
+ free(mask);
+
+}
+
+static void nlmeans_prefilter(BorderedPlane *src,
+ int filter_type)
+{
+
+ if (filter_type & NLMEANS_PREFILTER_MODE_MEAN3X3 ||
+ filter_type & NLMEANS_PREFILTER_MODE_MEAN5X5)
+ {
+
+ // Source image
+ uint8_t *mem = src->mem;
+ uint8_t *image = src->image;
+ int w = src->w;
+ int h = src->h;
+ int border = src->border;
+
+ // Duplicate plane
+ uint8_t *mem_pre = malloc(w * h * sizeof(uint8_t));
+ uint8_t *image_pre = mem_pre + border + w*border;
+ for (int y = 0; y < h; y++)
+ {
+ memcpy(mem_pre + y*w, mem + y*w, w);
+ }
+
+ // Filter plane; should already have at least 2px extra border on each side
+ if (filter_type & NLMEANS_PREFILTER_MODE_MEAN5X5)
+ {
+ // Mean 5x5
+ nlmeans_filter_mean(image, image_pre, w, h, border, 5);
+ }
+ else if (filter_type & NLMEANS_PREFILTER_MODE_MEAN3X3)
+ {
+ // Mean 3x3
+ nlmeans_filter_mean(image, image_pre, w, h, border, 3);
+ }
+
+ // Restore edges
+ if (filter_type & NLMEANS_PREFILTER_MODE_EDGEBOOST)
+ {
+ nlmeans_filter_edgeboost(image, image_pre, w, h, border);
+ }
+
+ // Blend source and destination for lesser effect
+ int wet = 1;
+ int dry = 0;
+ if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE50 &&
+ filter_type & NLMEANS_PREFILTER_MODE_REDUCE25)
+ {
+ wet = 1;
+ dry = 3;
+ }
+ else if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE50)
+ {
+ wet = 1;
+ dry = 1;
+ }
+ else if (filter_type & NLMEANS_PREFILTER_MODE_REDUCE25)
+ {
+ wet = 3;
+ dry = 1;
+ }
+ if (dry > 0)
+ {
+ for (int y = 0; y < h; y++)
+ {
+ for (int x = 0; x < w; x++)
+ {
+ *(mem_pre + w*y + x) = (uint8_t)((wet * *(mem_pre + w*y + x) + dry * *(mem + w*y + x)) / (wet + dry));
+ }
+ }
+ }
+
+ // Assign result
+ src->mem_pre = mem_pre;
+ src->image_pre = image_pre;
+
+ // Recreate borders
+ nlmeans_border(mem_pre, w, h, border);
+
+ }
+
+}
+
+static void nlmeans_plane(BorderedPlane *plane_tmp,
+ int *plane_ready,
+ uint8_t *dst,
+ int w,
+ int h,
+ double h_param,
+ double origin_tune,
+ int n,
+ int r)
+{
+
+ int n_half = (n-1) /2;
+ int r_half = (r-1) /2;
+
+ // Source image
+ uint8_t *src = plane_tmp[0].image;
+ uint8_t *src_pre = plane_tmp[0].image_pre;
+ int src_w = plane_tmp[0].w;
+
+ // Allocate temporary pixel sums
+ struct PixelSum *tmp_data = calloc(w * h, sizeof(struct PixelSum));
+
+ // Allocate integral image
+ int integral_stride = w + 2*16;
+ uint32_t *integral_mem = malloc(integral_stride * (h+1) * sizeof(uint32_t));
+ uint32_t *integral = integral_mem + integral_stride + 16;
+
+ // Precompute exponential table
+ float exptable[NLMEANS_EXPSIZE];
+ const float weight_factor = 1.0/n/n / (h_param * h_param);
+ const float min_weight_in_table = 0.0005;
+ const float stretch = NLMEANS_EXPSIZE / (-log(min_weight_in_table));
+ const float weight_fact_table = weight_factor * stretch;
+ const int diff_max = NLMEANS_EXPSIZE / weight_fact_table;
+ for (int i = 0; i < NLMEANS_EXPSIZE; i++)
+ {
+ exptable[i] = exp(-i/stretch);
+ }
+ exptable[NLMEANS_EXPSIZE-1] = 0;
+
+ // Iterate through available frames
+ for (int plane_index = 0; plane_ready[plane_index] == 1; plane_index++)
+ {
+
+ // Compare image
+ uint8_t *compare = plane_tmp[plane_index].image;
+ uint8_t *compare_pre = plane_tmp[plane_index].image_pre;
+ int compare_w = plane_tmp[plane_index].w;
+
+ // Iterate through all displacements
+ for (int dy = -r_half; dy <= r_half; dy++)
+ {
+ for (int dx = -r_half; dx <= r_half; dx++)
+ {
+
+ // Apply special weight tuning to origin patch
+ if (dx == 0 && dy == 0 && plane_index == 0)
+ {
+ // TODO: Parallelize this
+ for (int y = n_half; y < h-n + n_half; y++)
+ {
+ for (int x = n_half; x < w-n + n_half; x++)
+ {
+ tmp_data[y*w + x].weight_sum += origin_tune;
+ tmp_data[y*w + x].pixel_sum += origin_tune * src[y*src_w + x];
+ }
+ }
+ continue;
+ }
+
+ // Build integral
+ memset(integral-1 - integral_stride, 0, (w+1) * sizeof(uint32_t));
+ for (int y = 0; y < h; y++)
+ {
+ const uint8_t *p1 = src_pre + y*src_w;
+ const uint8_t *p2 = compare_pre + (y+dy)*compare_w + dx;
+ uint32_t *out = integral + (y*integral_stride) - 1;
+
+ *out++ = 0;
+
+ for (int x = 0; x < w; x++)
+ {
+ int diff = *p1++ - *p2++;
+ *out = *(out-1) + diff * diff;
+ out++;
+ }
+
+ if (y > 0)
+ {
+ out = integral + y*integral_stride;
+
+ for (int x = 0; x < w; x++)
+ {
+ *out += *(out - integral_stride);
+ out++;
+ }
+ }
+ }
+
+ // Average displacement
+ // TODO: Parallelize this
+ for (int y = 0; y <= h-n; y++)
+ {
+ const uint32_t *integral_ptr1 = integral + (y -1)*integral_stride - 1;
+ const uint32_t *integral_ptr2 = integral + (y+n-1)*integral_stride - 1;
+
+ for (int x = 0; x <= w-n; x++)
+ {
+ int xc = x + n_half;
+ int yc = y + n_half;
+
+ // Difference between patches
+ int diff = (uint32_t)(integral_ptr2[n] - integral_ptr2[0] - integral_ptr1[n] + integral_ptr1[0]);
+
+ // Sum pixel with weight
+ if (diff < diff_max)
+ {
+ int diffidx = diff * weight_fact_table;
+
+ //float weight = exp(-diff*weightFact);
+ float weight = exptable[diffidx];
+
+ tmp_data[yc*w + xc].weight_sum += weight;
+ tmp_data[yc*w + xc].pixel_sum += weight * compare[(yc+dy)*compare_w + xc + dx];
+ }
+
+ integral_ptr1++;
+ integral_ptr2++;
+ }
+ }
+ }
+ }
+ }
+
+ // Copy edges
+ for (int y = 0; y < h; y++)
+ {
+ for (int x = 0; x < n_half; x++)
+ {
+ *(dst + y*w + x) = *(src + y*src_w - x - 1);
+ *(dst + y*w - x + (w-1)) = *(src + y*src_w + x + w);
+ }
+ }
+ for (int y = 0; y < n_half; y++)
+ {
+ memcpy(dst + y*w, src - (y+1)*src_w, w);
+ memcpy(dst + (h-y-1)*w, src + (y+h)*src_w, w);
+ }
+
+ // Copy main image
+ uint8_t result;
+ for (int y = n_half; y < h-n_half; y++)
+ {
+ for (int x = n_half; x < w-n_half; x++)
+ {
+ result = (uint8_t)(tmp_data[y*w + x].pixel_sum / tmp_data[y*w + x].weight_sum);
+ *(dst + y*w + x) = result ? result : *(src + y*src_w + x);
+ }
+ }
+
+ free(tmp_data);
+ free(integral_mem);
+
+}
+
+static int hb_nlmeans_init(hb_filter_object_t *filter,
+ hb_filter_init_t *init)
+{
+ filter->private_data = calloc(sizeof(struct hb_filter_private_s), 1);
+ hb_filter_private_t *pv = filter->private_data;
+
+ // Mark parameters unset
+ for (int c = 0; c < 3; c++)
+ {
+ pv->strength[c] = -1;
+ pv->origin_tune[c] = -1;
+ pv->patch_size[c] = -1;
+ pv->range[c] = -1;
+ pv->frames[c] = -1;
+ pv->prefilter[c] = -1;
+ }
+
+ // Read user parameters
+ if (filter->settings != NULL)
+ {
+ sscanf(filter->settings, "%lf:%lf:%d:%d:%d:%d:%lf:%lf:%d:%d:%d:%d:%lf:%lf:%d:%d:%d:%d",
+ &pv->strength[0], &pv->origin_tune[0], &pv->patch_size[0], &pv->range[0], &pv->frames[0], &pv->prefilter[0],
+ &pv->strength[1], &pv->origin_tune[1], &pv->patch_size[1], &pv->range[1], &pv->frames[1], &pv->prefilter[1],
+ &pv->strength[2], &pv->origin_tune[2], &pv->patch_size[2], &pv->range[2], &pv->frames[2], &pv->prefilter[2]);
+ }
+
+ // Cascade values
+ // Cr not set; inherit Cb. Cb not set; inherit Y. Y not set; defaults.
+ for (int c = 1; c < 3; c++)
+ {
+ if (pv->strength[c] == -1) { pv->strength[c] = pv->strength[c-1]; }
+ if (pv->origin_tune[c] == -1) { pv->origin_tune[c] = pv->origin_tune[c-1]; }
+ if (pv->patch_size[c] == -1) { pv->patch_size[c] = pv->patch_size[c-1]; }
+ if (pv->range[c] == -1) { pv->range[c] = pv->range[c-1]; }
+ if (pv->frames[c] == -1) { pv->frames[c] = pv->frames[c-1]; }
+ if (pv->prefilter[c] == -1) { pv->prefilter[c] = pv->prefilter[c-1]; }
+ }
+
+ for (int c = 0; c < 3; c++)
+ {
+ // Replace unset values with defaults
+ if (pv->strength[c] == -1) { pv->strength[c] = c ? NLMEANS_STRENGTH_LUMA_DEFAULT : NLMEANS_STRENGTH_CHROMA_DEFAULT; }
+ if (pv->origin_tune[c] == -1) { pv->origin_tune[c] = c ? NLMEANS_ORIGIN_TUNE_LUMA_DEFAULT : NLMEANS_ORIGIN_TUNE_CHROMA_DEFAULT; }
+ if (pv->patch_size[c] == -1) { pv->patch_size[c] = c ? NLMEANS_PATCH_SIZE_LUMA_DEFAULT : NLMEANS_PATCH_SIZE_CHROMA_DEFAULT; }
+ if (pv->range[c] == -1) { pv->range[c] = c ? NLMEANS_RANGE_LUMA_DEFAULT : NLMEANS_RANGE_CHROMA_DEFAULT; }
+ if (pv->frames[c] == -1) { pv->frames[c] = c ? NLMEANS_FRAMES_LUMA_DEFAULT : NLMEANS_FRAMES_CHROMA_DEFAULT; }
+ if (pv->prefilter[c] == -1) { pv->prefilter[c] = c ? NLMEANS_PREFILTER_LUMA_DEFAULT : NLMEANS_PREFILTER_CHROMA_DEFAULT; }
+
+ // Sanitize
+ if (pv->strength[c] < 0) { pv->strength[c] = 0; }
+ if (pv->origin_tune[c] < 0.01) { pv->origin_tune[c] = 0.01; } // avoid black artifacts
+ if (pv->origin_tune[c] > 1) { pv->origin_tune[c] = 1; }
+ if (pv->patch_size[c] % 2 == 0) { pv->patch_size[c]--; }
+ if (pv->patch_size[c] < 1) { pv->patch_size[c] = 1; }
+ if (pv->range[c] % 2 == 0) { pv->range[c]--; }
+ if (pv->range[c] < 1) { pv->range[c] = 1; }
+ if (pv->frames[c] < 1) { pv->frames[c] = 1; }
+ if (pv->frames[c] > NLMEANS_FRAMES_MAX) { pv->frames[c] = NLMEANS_FRAMES_MAX; }
+ if (pv->prefilter[c] < 0) { pv->prefilter[c] = 0; }
+
+ // Mark buffer empty
+ for (int f = 0; f < NLMEANS_FRAMES_MAX; f++)
+ {
+ pv->frame_ready[c][f] = 0;
+ }
+ }
+
+ return 0;
+}
+
+static void hb_nlmeans_close(hb_filter_object_t *filter)
+{
+ hb_filter_private_t *pv = filter->private_data;
+
+ if (pv == NULL)
+ {
+ return;
+ }
+
+ for (int c = 0; c < 3; c++)
+ {
+ for (int f = 0; f < pv->frames[c]; f++)
+ {
+ if (pv->frame_tmp[c][f].mem_pre != NULL &&
+ pv->frame_tmp[c][f].mem_pre != pv->frame_tmp[c][f].mem)
+ {
+ free(pv->frame_tmp[c][f].mem_pre);
+ pv->frame_tmp[c][f].mem_pre = NULL;
+ }
+ if (pv->frame_tmp[c][f].mem != NULL)
+ {
+ free(pv->frame_tmp[c][f].mem);
+ pv->frame_tmp[c][f].mem = NULL;
+ }
+ }
+ }
+
+ free(pv);
+ filter->private_data = NULL;
+}
+
+static int hb_nlmeans_work(hb_filter_object_t *filter,
+ hb_buffer_t **buf_in,
+ hb_buffer_t **buf_out )
+{
+ hb_filter_private_t *pv = filter->private_data;
+ hb_buffer_t *in = *buf_in, *out;
+
+ if (in->size <= 0)
+ {
+ *buf_out = in;
+ *buf_in = NULL;
+ return HB_FILTER_DONE;
+ }
+
+ out = hb_video_buffer_init(in->f.width, in->f.height);
+
+ for (int c = 0; c < 3; c++)
+ {
+
+ if (pv->strength[c] == 0)
+ {
+ out->plane[c].data = in->plane[c].data;
+ continue;
+ }
+
+ int frames = pv->frames[c];
+
+ // Release last frame in buffer
+ if (pv->frame_tmp[c][frames-1].mem_pre != NULL &&
+ pv->frame_tmp[c][frames-1].mem_pre != pv->frame_tmp[c][frames-1].mem)
+ {
+ free(pv->frame_tmp[c][frames-1].mem_pre);
+ pv->frame_tmp[c][frames-1].mem_pre = NULL;
+ }
+ if (pv->frame_tmp[c][frames-1].mem != NULL)
+ {
+ free(pv->frame_tmp[c][frames-1].mem);
+ pv->frame_tmp[c][frames-1].mem = NULL;
+ }
+ pv->frame_ready[c][frames-1] = 0;
+
+ // Shift frames in buffer down one level
+ for (int f = frames-1; f > 0; f--)
+ {
+ pv->frame_tmp[c][f] = pv->frame_tmp[c][f-1];
+ pv->frame_ready[c][f] = pv->frame_ready[c][f-1];
+ }
+
+ // Extend copy of plane with extra border and place in buffer
+ int border = ((pv->range[c] + 2) / 2 + 15) /16*16;
+ int w = in->plane[c].stride + 2*border;
+ int h = in->plane[c].height + 2*border;
+ nlmeans_alloc(in->plane[c].data,
+ in->plane[c].stride,
+ in->plane[c].height,
+ &pv->frame_tmp[c][0],
+ w,
+ h,
+ border);
+ nlmeans_prefilter(&pv->frame_tmp[c][0], pv->prefilter[c]);
+ pv->frame_ready[c][0] = 1;
+
+ if (pv->prefilter[c] & NLMEANS_PREFILTER_MODE_PASSTHRU)
+ {
+ nlmeans_deborder(pv->frame_tmp[c][0].mem_pre, out->plane[c].data, w, h, border);
+ continue;
+ }
+
+ // Process current plane
+ nlmeans_plane(pv->frame_tmp[c],
+ pv->frame_ready[c],
+ out->plane[c].data,
+ in->plane[c].stride,
+ in->plane[c].height,
+ pv->strength[c],
+ pv->origin_tune[c],
+ pv->patch_size[c],
+ pv->range[c]);
+
+ }
+
+ out->s = in->s;
+ hb_buffer_move_subs(out, in);
+
+ *buf_out = out;
+
+ return HB_FILTER_OK;
+}