/* HandBrake/libhb/denoise.c (source listing metadata: 371 lines, 12 KiB, C) */

/*
Copyright (c) 2003 Daniel Moreno <comac AT comac DOT darktech DOT org>
Copyright (c) 2010 Baptiste Coudurier
Copyright (c) 2012 Loren Merritt
ported from FFmpeg.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "handbrake/handbrake.h"
#include "handbrake/hbffmpeg.h"
#include "libavutil/intreadwrite.h"
/*
 * Default filter strengths. hb_denoise_init() falls back to these (scaled
 * relative to the luma spatial strength) when a setting is not supplied.
 */
#define HQDN3D_SPATIAL_LUMA_DEFAULT 4.0f
#define HQDN3D_SPATIAL_CHROMA_DEFAULT 3.0f
#define HQDN3D_TEMPORAL_LUMA_DEFAULT 6.0f
/*
 * Resolution selector for the coefficient lookup tables: 8 for 16-bit
 * samples, 4 for every other depth. Each table holds (512 << LUT_BITS)
 * entries. NOTE: expands to an expression on a variable literally named
 * `depth`, which must be in scope wherever this macro is used.
 */
#define LUT_BITS (depth==16 ? 8 : 4)
/*
 * LOAD(x): read sample x of the current row and scale it to 16 bits.
 * For depth 8 the sample is the byte frame_src[x]; otherwise it is read with
 * AV_RN16A at byte offset x * 2. The value is shifted left by (16 - depth)
 * and ((1 << (16 - depth)) - 1) >> 1 is added (about half of one input step).
 * NOTE: relies on variables named `frame_src` and `depth` being in scope.
 */
#define LOAD(x) (((depth == 8 ? frame_src[x] : AV_RN16A(frame_src + (x) * 2)) << (16 - depth))\
+ (((1 << (16 - depth)) - 1) >> 1))
/*
 * STORE(x, val): write val >> (16 - depth) as sample x of the current output
 * row, as a byte for depth 8 or via AV_WN16A at byte offset x * 2 otherwise.
 * NOTE: relies on variables named `frame_dst` and `depth` being in scope.
 */
#define STORE(x,val) (depth == 8 ? frame_dst[x] = (val) >> (16 - depth) : \
AV_WN16A(frame_dst + (x) * 2, (val) >> (16 - depth)))
/* Per-instance state of the hqdn3d denoise filter. */
struct hb_filter_private_s
{
/* Lookup tables, filled by hqdn3d_precalc_coef() in hb_denoise_init():
 * [0]/[1] luma spatial/temporal, [2]/[3] Cb spatial/temporal,
 * [4]/[5] Cr spatial/temporal. Allocated with av_malloc(). */
int16_t *hqdn3d_coef[6];
/* Scratch row passed to the spatial filter as line_ant; allocated on the
 * first call to hb_denoise_work(). */
uint16_t *hqdn3d_line;
/* One history buffer per plane; allocated and seeded from the first frame
 * inside hqdn3d_denoise_depth(). */
uint16_t *hqdn3d_frame[3];
/* log2 chroma subsampling factors taken from the pixel format descriptor. */
int hsub, vsub;
/* Bit depth of component 0 of the pixel format. */
int depth;
/* Copies of the init structure taken at the start and end of
 * hb_denoise_init(). */
hb_filter_init_t input;
hb_filter_init_t output;
};
/* Forward declarations of the filter callbacks referenced by
 * hb_filter_denoise below. */
static int hb_denoise_init(hb_filter_object_t *filter,
hb_filter_init_t *init );
static int hb_denoise_work(hb_filter_object_t *filter,
hb_buffer_t **buf_in,
hb_buffer_t **buf_out);
static void hb_denoise_close(hb_filter_object_t *filter);
/*
 * Settings template: a colon-separated list of key=regex pairs, one per
 * strength setting read in hb_denoise_init(). Every value pattern is
 * HB_FLOAT_REG anchored with ^ and $.
 * NOTE(review): presumably consumed by the filter framework to validate
 * user-supplied settings - confirm against the settings parser.
 */
static const char denoise_template[] =
"y-spatial=^"HB_FLOAT_REG"$:cb-spatial=^"HB_FLOAT_REG"$:"
"cr-spatial=^"HB_FLOAT_REG"$:"
"y-temporal=^"HB_FLOAT_REG"$:cb-temporal=^"HB_FLOAT_REG"$:"
"cr-temporal=^"HB_FLOAT_REG"$";
/*
 * Filter descriptor for the hqdn3d denoiser: identifies the filter and wires
 * up its init/work/close callbacks and its settings template.
 * NOTE(review): the exact meaning of .enforce_order is defined by the filter
 * framework and is not visible in this file.
 */
hb_filter_object_t hb_filter_denoise =
{
.id = HB_FILTER_DENOISE,
.enforce_order = 1,
.name = "Denoise (hqdn3d)",
.settings = NULL,
.init = hb_denoise_init,
.work = hb_denoise_work,
.close = hb_denoise_close,
.settings_template = denoise_template,
};
/*
 * Fill one coefficient lookup table for the given filter strength.
 *
 * ct     - table with room for (512 << LUT_BITS) entries.
 * depth  - sample bit depth; only used through LUT_BITS.
 * dist25 - filter strength (clamped to 252.0 when computing the curve).
 *
 * Entry (256 << LUT_BITS) + i holds the rounded correction for a quantised
 * sample difference i. Afterwards ct[0] is overwritten with a flag that is
 * non-zero exactly when dist25 is non-zero; hqdn3d_denoise_depth() tests that
 * flag on the spatial table to decide whether spatial filtering is enabled.
 */
static void hqdn3d_precalc_coef(int16_t *ct, int depth, double dist25)
{
    const int    half  = 256 << LUT_BITS;
    const double gamma = log(0.25) / log(1.0 - FFMIN(dist25,252.0)/255.0 - 0.00001);
    int          idx;

    for (idx = -half; idx < half; idx++)
    {
        /* Midpoint of the bin that this table entry represents. */
        const double f     = (idx * (1 << (9-LUT_BITS)) + (1<<(8-LUT_BITS)) - 1) / 512.0;
        const double simil = FFMAX(0, 1.0 - fabs(f) / 255.0);
        const double C     = pow(simil, gamma) * 256.0 * f;

        ct[half + idx] = lrint(C);
    }

    /* Slot 0 doubles as the "this strength is enabled" flag. */
    ct[0] = !!dist25;
}
/*
 * One low-pass step: move curr_mul towards prev_mul by a table-driven amount.
 *
 * The difference (prev_mul - curr_mul) is reduced by (8 - LUT_BITS) bits and
 * used as a signed index into coef, so coef must point at the centre of a
 * table built by hqdn3d_precalc_coef() (callers add 256 << LUT_BITS first).
 * Returns curr_mul plus the looked-up correction.
 */
static inline unsigned int hqdn3d_lowpass_mul(int prev_mul, int curr_mul, int16_t *coef, int depth)
{
    const int shift = 8 - LUT_BITS;
    const int delta = (prev_mul - curr_mul) >> shift;

    return curr_mul + coef[delta];
}
/*
 * Temporal-only denoise of one plane.
 *
 * Every sample is low-passed against the value stored for the same position
 * in frame_ant; the result is written back to frame_ant and stored to the
 * output row.
 *
 * frame_src/frame_dst - first row of the input/output plane.
 * frame_ant           - history buffer, w entries per row (no padding).
 * w, h                - plane size in samples.
 * sstride/dstride     - byte distance between rows of frame_src/frame_dst.
 * temporal            - start of the temporal coefficient table.
 * depth               - sample bit depth (also consumed by LOAD/STORE).
 */
static void hqdn3d_denoise_temporal(uint8_t *frame_src, uint8_t *frame_dst,
                                    uint16_t *frame_ant,
                                    int w, int h, int sstride, int dstride,
                                    int16_t *temporal, int depth)
{
    /* Re-base at the table centre so signed differences index correctly. */
    int16_t *coef = temporal + (256 << LUT_BITS);
    long     row, col;

    for (row = 0; row < h; row++)
    {
        for (col = 0; col < w; col++)
        {
            uint32_t filtered = hqdn3d_lowpass_mul(frame_ant[col], LOAD(col), coef, depth);

            frame_ant[col] = filtered;
            STORE(col, filtered);
        }

        frame_src += sstride;
        frame_dst += dstride;
        frame_ant += w;
    }
}
/*
 * Spatial + temporal denoise of one plane.
 *
 * Each sample is low-passed against its left neighbour (running value),
 * against the filtered sample above it (line_ant), and finally against the
 * stored history for that position (frame_ant). line_ant and frame_ant are
 * both updated in place.
 *
 * frame_src/frame_dst - first row of the input/output plane.
 * line_ant            - scratch row with at least w entries.
 * frame_ant           - history buffer, w entries per row (no padding).
 * w, h                - plane size in samples.
 * sstride/dstride     - byte distance between rows of frame_src/frame_dst.
 * spatial/temporal    - start of the respective coefficient tables.
 * depth               - sample bit depth (also consumed by LOAD/STORE).
 */
static void hqdn3d_denoise_spatial(uint8_t *frame_src, uint8_t *frame_dst,
                                   uint16_t *line_ant, uint16_t *frame_ant,
                                   int w, int h, int sstride, int dstride,
                                   int16_t *spatial, int16_t *temporal, int depth)
{
    /* Re-base both tables at their centre so signed differences index them. */
    int16_t *scoef = spatial  + (256 << LUT_BITS);
    int16_t *tcoef = temporal + (256 << LUT_BITS);
    uint32_t left;  /* running horizontally filtered value */
    uint32_t cur;   /* value being produced for the current sample */
    long     row, col;

    /* First row has no neighbour above: filter horizontally, then in time. */
    left = LOAD(0);
    for (col = 0; col < w; col++)
    {
        left = hqdn3d_lowpass_mul(left, LOAD(col), scoef, depth);
        line_ant[col] = left;

        cur = hqdn3d_lowpass_mul(frame_ant[col], left, tcoef, depth);
        frame_ant[col] = cur;
        STORE(col, cur);
    }

    for (row = 1; row < h; row++)
    {
        frame_src += sstride;
        frame_dst += dstride;
        frame_ant += w;

        left = LOAD(0);
        for (col = 0; col < w-1; col++)
        {
            /* Vertical step against the row above. */
            cur = hqdn3d_lowpass_mul(line_ant[col], left, scoef, depth);
            line_ant[col] = cur;

            /* Advance the horizontal running value to the next sample. */
            left = hqdn3d_lowpass_mul(left, LOAD(col+1), scoef, depth);

            /* Temporal step against the stored history. */
            cur = hqdn3d_lowpass_mul(frame_ant[col], cur, tcoef, depth);
            frame_ant[col] = cur;
            STORE(col, cur);
        }

        /* Last column: there is no sample to the right to read ahead. */
        cur = hqdn3d_lowpass_mul(line_ant[col], left, scoef, depth);
        line_ant[col] = cur;

        cur = hqdn3d_lowpass_mul(frame_ant[col], cur, tcoef, depth);
        frame_ant[col] = cur;
        STORE(col, cur);
    }
}
/*
 * Denoise one plane at a given bit depth.
 *
 * On the first call for a plane (*frame_ant_ptr == NULL) a w * h history
 * buffer is allocated, stored in *frame_ant_ptr and seeded with the scaled
 * samples of the current frame. The plane is then filtered spatially and
 * temporally, or temporally only when the spatial table's enable flag
 * (spatial[0]) is zero.
 *
 * frame_src/frame_dst - first row of the input/output plane.
 * line_ant            - scratch row with at least w entries.
 * frame_ant_ptr       - in/out: history buffer for this plane.
 * w, h                - plane size in samples.
 * sstride/dstride     - byte distance between rows of frame_src/frame_dst.
 * spatial/temporal    - start of the respective coefficient tables.
 * depth               - sample bit depth (also consumed by LOAD/STORE).
 *
 * If the plane has no samples, or the history buffer cannot be allocated,
 * the function returns without writing to frame_dst; *frame_ant_ptr stays
 * NULL in the allocation-failure case so a later call can retry.
 */
static void hqdn3d_denoise_depth(uint8_t *frame_src, uint8_t *frame_dst,
                                 uint16_t *line_ant, uint16_t **frame_ant_ptr,
                                 int w, int h, int sstride, int dstride,
                                 int16_t *spatial, int16_t *temporal, int depth)
{
    long x, y;
    uint16_t *frame_ant = (*frame_ant_ptr);

    /* Nothing to filter; also keeps the filters from touching sample 0 of an
     * empty plane. */
    if (w <= 0 || h <= 0)
    {
        return;
    }

    if (!frame_ant)
    {
        uint8_t *src = frame_src;

        /* Sizes are widened to size_t before multiplying, and calloc itself
         * checks the rows * row-bytes product for overflow. */
        frame_ant = calloc((size_t)h, (size_t)w * sizeof(*frame_ant));
        if (!frame_ant)
        {
            hb_error("denoise: calloc failed");
            return;
        }
        (*frame_ant_ptr) = frame_ant;

        /* Seed the history with the current frame. */
        for (y = 0; y < h; y++, frame_src += sstride, frame_ant += w)
        {
            for (x = 0; x < w; x++)
            {
                frame_ant[x] = LOAD(x);
            }
        }
        frame_src = src;
        frame_ant = *frame_ant_ptr;
    }

    /* If no spatial coefficients, do temporal denoise only */
    if (spatial[0])
    {
        hqdn3d_denoise_spatial(frame_src, frame_dst, line_ant, frame_ant,
                               w, h, sstride, dstride, spatial, temporal, depth);
    }
    else
    {
        hqdn3d_denoise_temporal(frame_src, frame_dst, frame_ant,
                                w, h, sstride, dstride, temporal, depth);
    }
}
/*
 * Call hqdn3d_denoise_depth() with the bit depth appended as a literal
 * constant, selected from pv->depth. Requires a variable `pv` with a `depth`
 * member in scope at the call site. Depths not listed do nothing.
 *
 * The body is wrapped in do { } while (0) so the macro behaves as a single
 * statement, and the last line deliberately has NO trailing backslash so the
 * definition ends here and cannot absorb whatever line follows it.
 * NOTE(review): passing the depth as a literal presumably lets the compiler
 * specialise the depth-dependent LOAD/STORE/LUT_BITS expressions - confirm.
 */
#define hqdn3d_denoise(...) \
    do { \
        switch (pv->depth) { \
            case 8:  hqdn3d_denoise_depth(__VA_ARGS__, 8);  break; \
            case 9:  hqdn3d_denoise_depth(__VA_ARGS__, 9);  break; \
            case 10: hqdn3d_denoise_depth(__VA_ARGS__, 10); break; \
            case 12: hqdn3d_denoise_depth(__VA_ARGS__, 12); break; \
            case 14: hqdn3d_denoise_depth(__VA_ARGS__, 14); break; \
            case 16: hqdn3d_denoise_depth(__VA_ARGS__, 16); break; \
            default: break; \
        } \
    } while (0)
/*
 * Initialise the denoise filter instance.
 *
 * Allocates the private state, records the chroma subsampling and bit depth
 * of init->pix_fmt, reads the six strength settings from filter->settings
 * ("y-spatial", "cb-spatial", "cr-spatial", "y-temporal", "cb-temporal",
 * "cr-temporal"), derives any that are missing, and builds the six
 * coefficient lookup tables.
 *
 * Returns 0 on success. On failure (allocation failure or unknown pixel
 * format) an error is logged, everything allocated so far is released via
 * hb_denoise_close() and -1 is returned.
 */
static int hb_denoise_init( hb_filter_object_t * filter,
                            hb_filter_init_t   * init )
{
    filter->private_data = calloc( 1, sizeof(struct hb_filter_private_s) );
    if (filter->private_data == NULL)
    {
        hb_error("denoise: calloc failed");
        return -1;
    }
    hb_filter_private_t * pv = filter->private_data;

    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(init->pix_fmt);
    if (desc == NULL)
    {
        /* av_pix_fmt_desc_get() returns NULL for an unknown pixel format. */
        hb_error("denoise: unknown pixel format");
        hb_denoise_close(filter);
        return -1;
    }

    int i, depth;

    pv->hsub  = desc->log2_chroma_w;
    pv->vsub  = desc->log2_chroma_h;
    /* `depth` is also what the LUT_BITS macro reads below. */
    pv->depth = depth = desc->comp[0].depth;

    double spatial_luma, spatial_chroma_b, spatial_chroma_r;
    double temporal_luma, temporal_chroma_b, temporal_chroma_r;

    pv->input = *init;

    /* Missing strengths are derived from the ones already known. */
    if (!hb_dict_extract_double(&spatial_luma, filter->settings, "y-spatial"))
    {
        spatial_luma = HQDN3D_SPATIAL_LUMA_DEFAULT;
    }
    if (!hb_dict_extract_double(&spatial_chroma_b, filter->settings, "cb-spatial"))
    {
        spatial_chroma_b = HQDN3D_SPATIAL_CHROMA_DEFAULT *
                           spatial_luma / HQDN3D_SPATIAL_LUMA_DEFAULT;
    }
    if (!hb_dict_extract_double(&spatial_chroma_r, filter->settings, "cr-spatial"))
    {
        spatial_chroma_r = spatial_chroma_b;
    }
    if (!hb_dict_extract_double(&temporal_luma, filter->settings, "y-temporal"))
    {
        temporal_luma = HQDN3D_TEMPORAL_LUMA_DEFAULT *
                        spatial_luma / HQDN3D_SPATIAL_LUMA_DEFAULT;
    }
    if (!hb_dict_extract_double(&temporal_chroma_b, filter->settings, "cb-temporal"))
    {
        if (spatial_luma != 0.0)
        {
            temporal_chroma_b = temporal_luma * spatial_chroma_b / spatial_luma;
        }
        else
        {
            /* y-spatial=0 would make the chroma/luma ratio a division by
             * zero (NaN or infinity); use the default ratio instead. */
            temporal_chroma_b = temporal_luma * HQDN3D_SPATIAL_CHROMA_DEFAULT /
                                HQDN3D_SPATIAL_LUMA_DEFAULT;
        }
    }
    if (!hb_dict_extract_double(&temporal_chroma_r, filter->settings, "cr-temporal"))
    {
        temporal_chroma_r = temporal_chroma_b;
    }

    for (i = 0; i < 6; i++)
    {
        pv->hqdn3d_coef[i] = av_malloc((512<<LUT_BITS) * sizeof(int16_t));
        if (!pv->hqdn3d_coef[i])
        {
            /* Report the failure instead of returning success with
             * missing tables; close() releases the tables already made. */
            hb_error("denoise: av_malloc failed");
            hb_denoise_close(filter);
            return -1;
        }
    }

    hqdn3d_precalc_coef(pv->hqdn3d_coef[0], pv->depth, spatial_luma);
    hqdn3d_precalc_coef(pv->hqdn3d_coef[1], pv->depth, temporal_luma);
    hqdn3d_precalc_coef(pv->hqdn3d_coef[2], pv->depth, spatial_chroma_b);
    hqdn3d_precalc_coef(pv->hqdn3d_coef[3], pv->depth, temporal_chroma_b);
    hqdn3d_precalc_coef(pv->hqdn3d_coef[4], pv->depth, spatial_chroma_r);
    hqdn3d_precalc_coef(pv->hqdn3d_coef[5], pv->depth, temporal_chroma_r);

    pv->output = *init;
    return 0;
}
/*
 * Release everything owned by the filter instance: the six coefficient
 * tables, the scratch row, the three per-plane history buffers and the
 * private state itself. filter->private_data is reset to NULL. Does nothing
 * when there is no private state.
 */
static void hb_denoise_close(hb_filter_object_t * filter)
{
    hb_filter_private_t *pv = filter->private_data;
    int idx;

    if (pv == NULL)
    {
        return;
    }

    for (idx = 0; idx < 6; idx++)
    {
        av_freep(&pv->hqdn3d_coef[idx]);
    }

    /* free(NULL) is a no-op, so the buffers need no individual guards. */
    free(pv->hqdn3d_line);
    pv->hqdn3d_line = NULL;

    for (idx = 0; idx < 3; idx++)
    {
        free(pv->hqdn3d_frame[idx]);
        pv->hqdn3d_frame[idx] = NULL;
    }

    free(pv);
    filter->private_data = NULL;
}
/*
 * Filter one frame.
 *
 * An EOF buffer is handed through unchanged (*buf_out takes ownership of the
 * input, *buf_in is cleared) and HB_FILTER_DONE is returned. Otherwise a new
 * output frame is allocated, each of the three planes is denoised with its
 * own spatial/temporal coefficient pair, the input's properties are copied
 * to the output and HB_FILTER_OK is returned.
 *
 * If the scratch row or the output frame cannot be allocated, an error is
 * logged, *buf_out is set to NULL and HB_FILTER_FAILED is returned.
 */
static int hb_denoise_work(hb_filter_object_t *filter,
                           hb_buffer_t **buf_in,
                           hb_buffer_t **buf_out)
{
    hb_filter_private_t *pv = filter->private_data;
    hb_buffer_t *in = *buf_in, *out;

    if (in->s.flags & HB_BUF_FLAG_EOF)
    {
        *buf_out = in;
        *buf_in = NULL;
        return HB_FILTER_DONE;
    }

    /* Allocate the scratch row first so a failure here cannot leak `out`. */
    if (!pv->hqdn3d_line)
    {
        pv->hqdn3d_line = malloc(in->plane[0].stride * sizeof(uint16_t));
        if (!pv->hqdn3d_line)
        {
            hb_error("denoise: malloc failed");
            *buf_out = NULL;
            return HB_FILTER_FAILED;
        }
    }

    out = hb_frame_buffer_init(pv->output.pix_fmt, in->f.width, in->f.height);
    if (out == NULL)
    {
        hb_error("denoise: hb_frame_buffer_init failed");
        *buf_out = NULL;
        return HB_FILTER_FAILED;
    }
    out->f.color_prim      = pv->output.color_prim;
    out->f.color_transfer  = pv->output.color_transfer;
    out->f.color_matrix    = pv->output.color_matrix;
    out->f.color_range     = pv->output.color_range;
    out->f.chroma_location = pv->output.chroma_location;

    int c, coef_index;

    for (c = 0; c < 3; c++)
    {
        /* Tables are stored as spatial/temporal pairs, one pair per plane. */
        coef_index = c * 2;
        /* Planes 1 and 2 are reduced by the chroma subsampling shifts. */
        hqdn3d_denoise(in->plane[c].data,
                       out->plane[c].data,
                       pv->hqdn3d_line,
                       &pv->hqdn3d_frame[c],
                       AV_CEIL_RSHIFT(in->f.width,  (!!c * pv->hsub)),
                       AV_CEIL_RSHIFT(in->f.height, (!!c * pv->vsub)),
                       in->plane[c].stride,
                       out->plane[c].stride,
                       pv->hqdn3d_coef[coef_index],
                       pv->hqdn3d_coef[coef_index+1]);
    }

    hb_buffer_copy_props(out, in);
    *buf_out = out;
    return HB_FILTER_OK;
}