source/libvpx/vp9/encoder/vp9_denoiser.c - Issue 375983002: libvpx: Pull from upstream

Unified Diff: source/libvpx/vp9/encoder/vp9_denoiser.c

Issue 375983002: libvpx: Pull from upstream (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/deps/third_party/libvpx/

Patch Set: Created 6 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: source/libvpx/vp9/encoder/vp9_denoiser.c

===================================================================

--- source/libvpx/vp9/encoder/vp9_denoiser.c (revision 281795)

+++ source/libvpx/vp9/encoder/vp9_denoiser.c (working copy)

@@ -9,38 +9,90 @@

#include <assert.h>

+#include <limits.h>

#include "vpx_scale/yv12config.h"

#include "vpx/vpx_integer.h"

+#include "vp9/common/vp9_reconinter.h"

#include "vp9/encoder/vp9_denoiser.h"

+/* The VP9 denoiser is a work-in-progress. It currently is only designed to work

+ * with speed 6, though it (inexplicably) seems to also work with speed 5 (one

+ * would need to modify the source code in vp9_pickmode.c and vp9_encoder.c to

+ * make the calls to the vp9_denoiser_* functions when in speed 5).

+ *

+ * The implementation is very similar to that of the VP8 denoiser. While

+ * choosing the motion vectors / reference frames, the denoiser is run, and if

+ * it did not modify the signal too much, the denoised block is copied to the

+ * signal.

+ */

+#ifdef OUTPUT_YUV_DENOISED

+static void make_grayscale(YV12_BUFFER_CONFIG *yuv);

+#endif

static const int widths[] = {4, 4, 8, 8, 8, 16, 16, 16, 32, 32, 32, 64, 64};

static const int heights[] = {4, 8, 4, 8, 16, 8, 16, 32, 16, 32, 64, 32, 64};

-int vp9_denoiser_filter() {

- return 0;

+static int absdiff_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ (void)bs;

+ return 3 + (increase_denoising ? 1 : 0);

}

-static int update_running_avg(const uint8_t *mc_avg, int mc_avg_stride,

- uint8_t *avg, int avg_stride,

- const uint8_t *sig, int sig_stride,

- int increase_denoising, BLOCK_SIZE bs) {

+static int delta_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ (void)bs;

+ (void)increase_denoising;

+ return 4;

+static int noise_motion_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ (void)bs;

+ (void)increase_denoising;

+ return 25 * 25;

+static unsigned int sse_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ return widths[bs] * heights[bs] * (increase_denoising ? 60 : 40);

+static int sse_diff_thresh(BLOCK_SIZE bs, int increase_denoising,

+ int mv_row, int mv_col) {

+ if (mv_row * mv_row + mv_col * mv_col >

+ noise_motion_thresh(bs, increase_denoising)) {

+ return 0;

+ } else {

+ return widths[bs] * heights[bs] * 20;

+ }

+static int total_adj_strong_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ return widths[bs] * heights[bs] * (increase_denoising ? 3 : 2);

+static int total_adj_weak_thresh(BLOCK_SIZE bs, int increase_denoising) {

+ return widths[bs] * heights[bs] * (increase_denoising ? 3 : 2);

+static VP9_DENOISER_DECISION denoiser_filter(const uint8_t *sig, int sig_stride,

+ const uint8_t *mc_avg,

+ int mc_avg_stride,

+ uint8_t *avg, int avg_stride,

+ int increase_denoising,

+ BLOCK_SIZE bs) {

int r, c;

- int diff, adj, absdiff;

- int shift_inc1 = 0, shift_inc2 = 1;

+ const uint8_t *sig_start = sig;

+ const uint8_t *mc_avg_start = mc_avg;

+ uint8_t *avg_start = avg;

+ int diff, adj, absdiff, delta;

int adj_val[] = {3, 4, 6};

int total_adj = 0;

- if (increase_denoising) {

- shift_inc1 = 1;

- shift_inc2 = 2;

- }

+ // First attempt to apply a strong temporal denoising filter.

for (r = 0; r < heights[bs]; ++r) {

for (c = 0; c < widths[bs]; ++c) {

diff = mc_avg[c] - sig[c];

absdiff = abs(diff);

- if (absdiff <= 3 + shift_inc1) {

+ if (absdiff <= absdiff_thresh(bs, increase_denoising)) {

avg[c] = mc_avg[c];

total_adj += diff;

} else {

@@ -68,7 +120,47 @@

avg += avg_stride;

mc_avg += mc_avg_stride;

}

- return total_adj;

+ // If the strong filter did not modify the signal too much, we're all set.

+ if (abs(total_adj) <= total_adj_strong_thresh(bs, increase_denoising)) {

+ return FILTER_BLOCK;

+ }

+ // Otherwise, we try to dampen the filter if the delta is not too high.

+ delta = ((abs(total_adj) - total_adj_strong_thresh(bs, increase_denoising))

+ >> 8) + 1;

+ if (delta > delta_thresh(bs, increase_denoising)) {

+ return COPY_BLOCK;

+ }

+ mc_avg = mc_avg_start;

+ avg = avg_start;

+ sig = sig_start;

+ for (r = 0; r < heights[bs]; ++r) {

+ for (c = 0; c < widths[bs]; ++c) {

+ diff = mc_avg[c] - sig[c];

+ adj = abs(diff);

+ if (adj > delta) {

+ adj = delta;

+ }

+ if (diff > 0) {

+ avg[c] = MAX(0, avg[c] - adj);

+ total_adj += adj;

+ } else {

+ avg[c] = MIN(UINT8_MAX, avg[c] + adj);

+ total_adj -= adj;

+ }

+ sig += sig_stride;

+ avg += avg_stride;

+ mc_avg += mc_avg_stride;

+ }

+ // We can use the filter if it has been sufficiently dampened

+ if (abs(total_adj) <= total_adj_weak_thresh(bs, increase_denoising)) {

+ return FILTER_BLOCK;

+ }

+ return COPY_BLOCK;

}

static uint8_t *block_start(uint8_t *framebuf, int stride,

@@ -76,51 +168,174 @@

return framebuf + (stride * mi_row * 8) + (mi_col * 8);

}

-void copy_block(uint8_t *dest, int dest_stride,

- uint8_t *src, int src_stride, BLOCK_SIZE bs) {

- int r, c;

+static void copy_block(uint8_t *dest, int dest_stride,

+ const uint8_t *src, int src_stride, BLOCK_SIZE bs) {

+ int r;

for (r = 0; r < heights[bs]; ++r) {

- for (c = 0; c < widths[bs]; ++c) {

- dest[c] = src[c];

- }

+ vpx_memcpy(dest, src, widths[bs]);

dest += dest_stride;

src += src_stride;

}

+static VP9_DENOISER_DECISION perform_motion_compensation(VP9_DENOISER *denoiser,

+ MACROBLOCK *mb,

+ BLOCK_SIZE bs,

+ int increase_denoising,

+ int mi_row,

+ int mi_col) {

+ int mv_col, mv_row;

+ int sse_diff = denoiser->zero_mv_sse - denoiser->best_sse;

+ MV_REFERENCE_FRAME frame;

+ MACROBLOCKD *filter_mbd = &mb->e_mbd;

+ MB_MODE_INFO *mbmi = &filter_mbd->mi[0]->mbmi;

+ // We will restore these after motion compensation.

+ MB_MODE_INFO saved_mbmi = *mbmi;

+ struct buf_2d saved_dst = filter_mbd->plane[0].dst;

+ struct buf_2d saved_pre[2];

+ saved_pre[0] = filter_mbd->plane[0].pre[0];

+ saved_pre[1] = filter_mbd->plane[0].pre[1];

+ mv_col = denoiser->best_sse_mv.as_mv.col;

+ mv_row = denoiser->best_sse_mv.as_mv.row;

+ frame = denoiser->best_reference_frame;

+ // If the best reference frame uses inter-prediction and there is enough of a

+ // difference in sum-squared-error, use it.

+ if (frame != INTRA_FRAME &&

+ sse_diff > sse_diff_thresh(bs, increase_denoising, mv_row, mv_col)) {

+ mbmi->ref_frame[0] = denoiser->best_reference_frame;

+ mbmi->mode = denoiser->best_sse_inter_mode;

+ mbmi->mv[0] = denoiser->best_sse_mv;

+ } else {

+ // Otherwise, use the zero reference frame.

+ frame = denoiser->best_zeromv_reference_frame;

+ mbmi->ref_frame[0] = denoiser->best_zeromv_reference_frame;

+ mbmi->mode = ZEROMV;

+ mbmi->mv[0].as_int = 0;

+ denoiser->best_sse_inter_mode = ZEROMV;

+ denoiser->best_sse_mv.as_int = 0;

+ denoiser->best_sse = denoiser->zero_mv_sse;

+ }

+ // Set the pointers in the MACROBLOCKD to point to the buffers in the denoiser

+ // struct.

+ filter_mbd->plane[0].pre[0].buf =

+ block_start(denoiser->running_avg_y[frame].y_buffer,

+ denoiser->running_avg_y[frame].y_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[0].pre[0].stride = denoiser->running_avg_y[frame].y_stride;

+ filter_mbd->plane[1].pre[0].buf =

+ block_start(denoiser->running_avg_y[frame].u_buffer,

+ denoiser->running_avg_y[frame].uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[1].pre[0].stride = denoiser->running_avg_y[frame].uv_stride;

+ filter_mbd->plane[2].pre[0].buf =

+ block_start(denoiser->running_avg_y[frame].v_buffer,

+ denoiser->running_avg_y[frame].uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[2].pre[0].stride = denoiser->running_avg_y[frame].uv_stride;

+ filter_mbd->plane[0].pre[1].buf =

+ block_start(denoiser->running_avg_y[frame].y_buffer,

+ denoiser->running_avg_y[frame].y_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[0].pre[1].stride = denoiser->running_avg_y[frame].y_stride;

+ filter_mbd->plane[1].pre[1].buf =

+ block_start(denoiser->running_avg_y[frame].u_buffer,

+ denoiser->running_avg_y[frame].uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[1].pre[1].stride = denoiser->running_avg_y[frame].uv_stride;

+ filter_mbd->plane[2].pre[1].buf =

+ block_start(denoiser->running_avg_y[frame].v_buffer,

+ denoiser->running_avg_y[frame].uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[2].pre[1].stride = denoiser->running_avg_y[frame].uv_stride;

+ filter_mbd->plane[0].dst.buf =

+ block_start(denoiser->mc_running_avg_y.y_buffer,

+ denoiser->mc_running_avg_y.y_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[0].dst.stride = denoiser->mc_running_avg_y.y_stride;

+ filter_mbd->plane[1].dst.buf =

+ block_start(denoiser->mc_running_avg_y.u_buffer,

+ denoiser->mc_running_avg_y.uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[1].dst.stride = denoiser->mc_running_avg_y.y_stride;

+ filter_mbd->plane[2].dst.buf =

+ block_start(denoiser->mc_running_avg_y.v_buffer,

+ denoiser->mc_running_avg_y.uv_stride,

+ mi_row, mi_col);

+ filter_mbd->plane[2].dst.stride = denoiser->mc_running_avg_y.y_stride;

+ vp9_build_inter_predictors_sby(filter_mbd, mv_row, mv_col, bs);

+ // Restore everything to its original state

+ filter_mbd->plane[0].pre[0] = saved_pre[0];

+ filter_mbd->plane[0].pre[1] = saved_pre[1];

+ filter_mbd->plane[0].dst = saved_dst;

+ *mbmi = saved_mbmi;

+ mv_row = denoiser->best_sse_mv.as_mv.row;

+ mv_col = denoiser->best_sse_mv.as_mv.col;

+ if (denoiser->best_sse > sse_thresh(bs, increase_denoising)) {

+ return COPY_BLOCK;

+ }

+ if (mv_row * mv_row + mv_col * mv_col >

+ 8 * noise_motion_thresh(bs, increase_denoising)) {

+ return COPY_BLOCK;

+ }

+ return FILTER_BLOCK;

void vp9_denoiser_denoise(VP9_DENOISER *denoiser, MACROBLOCK *mb,

int mi_row, int mi_col, BLOCK_SIZE bs) {

- int decision = COPY_BLOCK;

+ VP9_DENOISER_DECISION decision = FILTER_BLOCK;

YV12_BUFFER_CONFIG avg = denoiser->running_avg_y[INTRA_FRAME];

+ YV12_BUFFER_CONFIG mc_avg = denoiser->mc_running_avg_y;

+ uint8_t *avg_start = block_start(avg.y_buffer, avg.y_stride, mi_row, mi_col);

+ uint8_t *mc_avg_start = block_start(mc_avg.y_buffer, mc_avg.y_stride,

+ mi_row, mi_col);

struct buf_2d src = mb->plane[0].src;

- update_running_avg(denoiser->mc_running_avg_y.y_buffer,

- denoiser->mc_running_avg_y.y_stride,

- denoiser->running_avg_y[INTRA_FRAME].y_buffer,

- denoiser->running_avg_y[INTRA_FRAME].y_stride,

- mb->plane[0].src.buf, mb->plane[0].src.stride, 0, bs);

+ decision = perform_motion_compensation(denoiser, mb, bs,

+ denoiser->increase_denoising,

+ mi_row, mi_col);

if (decision == FILTER_BLOCK) {

- // TODO(tkopp)

+ decision = denoiser_filter(src.buf, src.stride,

+ mc_avg_start, mc_avg.y_stride,

+ avg_start, avg.y_stride,

+ 0, bs);

}

- if (decision == COPY_BLOCK) {

- copy_block(block_start(avg.y_buffer, avg.y_stride, mi_row, mi_col),

- avg.y_stride, src.buf, src.stride, bs);

+ if (decision == FILTER_BLOCK) {

+ copy_block(src.buf, src.stride, avg_start, avg.y_stride, bs);

+ } else { // COPY_BLOCK

+ copy_block(avg_start, avg.y_stride, src.buf, src.stride, bs);

}

static void copy_frame(YV12_BUFFER_CONFIG dest, const YV12_BUFFER_CONFIG src) {

- int r, c;

+ int r;

const uint8_t *srcbuf = src.y_buffer;

uint8_t *destbuf = dest.y_buffer;

assert(dest.y_width == src.y_width);

assert(dest.y_height == src.y_height);

for (r = 0; r < dest.y_height; ++r) {

- for (c = 0; c < dest.y_width; ++c) {

- destbuf[c] = srcbuf[c];

- }

+ vpx_memcpy(destbuf, srcbuf, dest.y_width);

destbuf += dest.y_stride;

srcbuf += src.y_stride;

}

@@ -155,9 +370,27 @@

}

-void vp9_denoiser_update_frame_stats() {

+void vp9_denoiser_reset_frame_stats(VP9_DENOISER *denoiser) {

+ denoiser->zero_mv_sse = UINT_MAX;

+ denoiser->best_sse = UINT_MAX;

}

+void vp9_denoiser_update_frame_stats(VP9_DENOISER *denoiser, MB_MODE_INFO *mbmi,

+ unsigned int sse, PREDICTION_MODE mode) {

+ // TODO(tkopp): Use both MVs if possible

+ if (mbmi->mv[0].as_int == 0 && sse < denoiser->zero_mv_sse) {

+ denoiser->zero_mv_sse = sse;

+ denoiser->best_zeromv_reference_frame = mbmi->ref_frame[0];

+ }

+ if (mbmi->mv[0].as_int != 0 && sse < denoiser->best_sse) {

+ denoiser->best_sse = sse;

+ denoiser->best_sse_inter_mode = mode;

+ denoiser->best_sse_mv = mbmi->mv[0];

+ denoiser->best_reference_frame = mbmi->ref_frame[0];

+ }

int vp9_denoiser_alloc(VP9_DENOISER *denoiser, int width, int height,

int ssx, int ssy, int border) {

int i, fail;

@@ -170,6 +403,9 @@

vp9_denoiser_free(denoiser);

return 1;

}

+#ifdef OUTPUT_YUV_DENOISED

+ make_grayscale(&denoiser->running_avg_y[i]);

+#endif

}

fail = vp9_alloc_frame_buffer(&denoiser->mc_running_avg_y, width, height,

@@ -178,6 +414,10 @@

vp9_denoiser_free(denoiser);

return 1;

}

+#ifdef OUTPUT_YUV_DENOISED

+ make_grayscale(&denoiser->running_avg_y[i]);

+#endif

+ denoiser->increase_denoising = 0;

return 0;

}

@@ -196,3 +436,22 @@

vp9_free_frame_buffer(&denoiser->mc_running_avg_y);

}

+#ifdef OUTPUT_YUV_DENOISED

+static void make_grayscale(YV12_BUFFER_CONFIG *yuv) {

+ int r, c;

+ uint8_t *u = yuv->u_buffer;

+ uint8_t *v = yuv->v_buffer;

+ // The '/2's are there because we have a 440 buffer, but we want to output

+ // 420.

+ for (r = 0; r < yuv->uv_height / 2; ++r) {

+ for (c = 0; c < yuv->uv_width / 2; ++c) {

+ u[c] = UINT8_MAX / 2;

+ v[c] = UINT8_MAX / 2;

+ }

+ u += yuv->uv_stride + yuv->uv_width / 2;

+ v += yuv->uv_stride + yuv->uv_width / 2;

+ }

+#endif

« no previous file with comments | « source/libvpx/vp9/encoder/vp9_denoiser.h ('k') | source/libvpx/vp9/encoder/vp9_encodeframe.h » ('j') | no next file with comments »