FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavfilter/vf_owdenoise.c
Date: 2023-10-02 11:06:47
Exec Total Coverage
Lines: 110 139 79.1%
Functions: 10 10 100.0%
Branches: 57 82 69.5%

Line Branch Exec Source
1 /*
2 * Copyright (c) 2007 Michael Niedermayer <michaelni@gmx.at>
3 * Copyright (c) 2013 Clément Bœsch <u pkh me>
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License along
18 * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
19 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
20 */
21
22 // The code written by Michael Niedermayer in 70024b6b47b9eacfe01e8f92349ca9bf1ccd7d5a:libavfilter/vf_owdenoise.c
23 // can also be used under the LGPL due to:
24 // <michaelni> durandal_1707, if you do all the "todo" points from vf_owdenoise.c that are in that file since 2013 then sure i would be more than happy to relicense my part of it to LGPL
25 // <durandal_1707> michaelni: first relicense than work
26
27 /**
28 * @todo try to change to int
29 * @todo try lifting based implementation
30 * @todo optimize optimize optimize
31 * @todo hard thresholding
32 * @todo use QP to decide filter strength
33 * @todo wavelet normalization / least squares optimal signal vs. noise thresholds
34 */
35
36 #include "libavutil/imgutils.h"
37 #include "libavutil/opt.h"
38 #include "libavutil/mem_internal.h"
39 #include "libavutil/pixdesc.h"
40 #include "avfilter.h"
41 #include "internal.h"
42 #include "video.h"
43
44 typedef struct OWDenoiseContext {
45 const AVClass *class;
46 double luma_strength;
47 double chroma_strength;
48 int depth;
49 float *plane[16+1][4];
50 int linesize;
51 int hsub, vsub;
52 int pixel_depth;
53 } OWDenoiseContext;
54
55 #define OFFSET(x) offsetof(OWDenoiseContext, x)
56 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
57 static const AVOption owdenoise_options[] = {
58 { "depth", "set depth", OFFSET(depth), AV_OPT_TYPE_INT, {.i64 = 8}, 8, 16, FLAGS },
59 { "luma_strength", "set luma strength", OFFSET(luma_strength), AV_OPT_TYPE_DOUBLE, {.dbl = 1.0}, 0, 1000, FLAGS },
60 { "ls", "set luma strength", OFFSET(luma_strength), AV_OPT_TYPE_DOUBLE, {.dbl = 1.0}, 0, 1000, FLAGS },
61 { "chroma_strength", "set chroma strength", OFFSET(chroma_strength), AV_OPT_TYPE_DOUBLE, {.dbl = 1.0}, 0, 1000, FLAGS },
62 { "cs", "set chroma strength", OFFSET(chroma_strength), AV_OPT_TYPE_DOUBLE, {.dbl = 1.0}, 0, 1000, FLAGS },
63 { NULL }
64 };
65
66 AVFILTER_DEFINE_CLASS(owdenoise);
67
68 DECLARE_ALIGNED(8, static const uint8_t, dither)[8][8] = {
69 { 0, 48, 12, 60, 3, 51, 15, 63 },
70 { 32, 16, 44, 28, 35, 19, 47, 31 },
71 { 8, 56, 4, 52, 11, 59, 7, 55 },
72 { 40, 24, 36, 20, 43, 27, 39, 23 },
73 { 2, 50, 14, 62, 1, 49, 13, 61 },
74 { 34, 18, 46, 30, 33, 17, 45, 29 },
75 { 10, 58, 6, 54, 9, 57, 5, 53 },
76 { 42, 26, 38, 22, 41, 25, 37, 21 },
77 };
78
79 static const double coeff[2][5] = {
80 {
81 0.6029490182363579 * M_SQRT2,
82 0.2668641184428723 * M_SQRT2,
83 -0.07822326652898785 * M_SQRT2,
84 -0.01686411844287495 * M_SQRT2,
85 0.02674875741080976 * M_SQRT2,
86 },{
87 1.115087052456994 / M_SQRT2,
88 -0.5912717631142470 / M_SQRT2,
89 -0.05754352622849957 / M_SQRT2,
90 0.09127176311424948 / M_SQRT2,
91 }
92 };
93
94 static const double icoeff[2][5] = {
95 {
96 1.115087052456994 / M_SQRT2,
97 0.5912717631142470 / M_SQRT2,
98 -0.05754352622849957 / M_SQRT2,
99 -0.09127176311424948 / M_SQRT2,
100 },{
101 0.6029490182363579 * M_SQRT2,
102 -0.2668641184428723 * M_SQRT2,
103 -0.07822326652898785 * M_SQRT2,
104 0.01686411844287495 * M_SQRT2,
105 0.02674875741080976 * M_SQRT2,
106 }
107 };
108
109
110 334400 static inline void decompose(float *dst_l, float *dst_h, const float *src,
111 int linesize, int w)
112 {
113 int x, i;
114
2/2
✓ Branch 0 taken 4608000 times.
✓ Branch 1 taken 334400 times.
4942400 for (x = 0; x < w; x++) {
115 4608000 double sum_l = src[x * linesize] * coeff[0][0];
116 4608000 double sum_h = src[x * linesize] * coeff[1][0];
117
2/2
✓ Branch 0 taken 18432000 times.
✓ Branch 1 taken 4608000 times.
23040000 for (i = 1; i <= 4; i++) {
118 18432000 const double s = src[avpriv_mirror(x - i, w - 1) * linesize]
119 18432000 + src[avpriv_mirror(x + i, w - 1) * linesize];
120
121 18432000 sum_l += coeff[0][i] * s;
122 18432000 sum_h += coeff[1][i] * s;
123 }
124 4608000 dst_l[x * linesize] = sum_l;
125 4608000 dst_h[x * linesize] = sum_h;
126 }
127 334400 }
128
129 334400 static inline void compose(float *dst, const float *src_l, const float *src_h,
130 int linesize, int w)
131 {
132 int x, i;
133
2/2
✓ Branch 0 taken 4608000 times.
✓ Branch 1 taken 334400 times.
4942400 for (x = 0; x < w; x++) {
134 4608000 double sum_l = src_l[x * linesize] * icoeff[0][0];
135 4608000 double sum_h = src_h[x * linesize] * icoeff[1][0];
136
2/2
✓ Branch 0 taken 18432000 times.
✓ Branch 1 taken 4608000 times.
23040000 for (i = 1; i <= 4; i++) {
137 18432000 const int x0 = avpriv_mirror(x - i, w - 1) * linesize;
138 18432000 const int x1 = avpriv_mirror(x + i, w - 1) * linesize;
139
140 18432000 sum_l += icoeff[0][i] * (src_l[x0] + src_l[x1]);
141 18432000 sum_h += icoeff[1][i] * (src_h[x0] + src_h[x1]);
142 }
143 4608000 dst[x * linesize] = (sum_l + sum_h) * 0.5;
144 }
145 334400 }
146
/**
 * Run decompose() over every line of a 2D buffer along one axis.
 *
 * Each line is processed as `step` interleaved runs: run number `phase`
 * starts at sample `phase` and advances by `step` samples, so it holds
 * ceil((w - phase) / step) samples.
 *
 * @param dst_l     low band output
 * @param dst_h     high band output
 * @param src       input buffer
 * @param xlinesize stride between neighbouring samples along the filtered axis
 * @param ylinesize stride between consecutive lines
 * @param step      sample spacing within a run
 * @param w         number of samples per line along the filtered axis
 * @param h         number of lines
 */
static inline void decompose2D(float *dst_l, float *dst_h, const float *src,
                               int xlinesize, int ylinesize,
                               int step, int w, int h)
{
    int line, phase;

    for (line = 0; line < h; line++) {
        const int line_off = ylinesize * line;

        for (phase = 0; phase < step; phase++) {
            const int off = line_off + xlinesize * phase;
            const int len = (w - phase + step - 1) / step;

            decompose(dst_l + off, dst_h + off, src + off,
                      step * xlinesize, len);
        }
    }
}
159
/**
 * Run compose() over every line of a 2D buffer along one axis.
 *
 * Each line is processed as `step` interleaved runs: run number `phase`
 * starts at sample `phase` and advances by `step` samples, so it holds
 * ceil((w - phase) / step) samples.
 *
 * @param dst       reconstructed output
 * @param src_l     low band input
 * @param src_h     high band input
 * @param xlinesize stride between neighbouring samples along the filtered axis
 * @param ylinesize stride between consecutive lines
 * @param step      sample spacing within a run
 * @param w         number of samples per line along the filtered axis
 * @param h         number of lines
 */
static inline void compose2D(float *dst, const float *src_l, const float *src_h,
                             int xlinesize, int ylinesize,
                             int step, int w, int h)
{
    int line, phase;

    for (line = 0; line < h; line++) {
        const int line_off = ylinesize * line;

        for (phase = 0; phase < step; phase++) {
            const int off = line_off + xlinesize * phase;
            const int len = (w - phase + step - 1) / step;

            compose(dst + off, src_l + off, src_h + off,
                    step * xlinesize, len);
        }
    }
}
172
/**
 * One level of the separable 2D decomposition.
 *
 * The source is first split along the rows into temp[0] (low) and temp[1]
 * (high); each of those is then split along the columns, giving four bands.
 *
 * @param dst      four output bands: dst[0]/dst[1] come from the row-low
 *                 half, dst[2]/dst[3] from the row-high half
 * @param src      input buffer
 * @param temp     two scratch buffers for the row pass
 * @param linesize stride of all buffers, in floats
 * @param step     sample spacing for this level
 * @param w        width in samples
 * @param h        height in samples
 */
static void decompose2D2(float *dst[4], float *src, float *temp[2],
                         int linesize, int step, int w, int h)
{
    float *const row_low  = temp[0];
    float *const row_high = temp[1];

    /* horizontal pass: unit sample stride, one line per image row */
    decompose2D(row_low, row_high, src, 1, linesize, step, w, h);

    /* vertical passes: strides and dimensions are swapped */
    decompose2D(dst[0], dst[1], row_low,  linesize, 1, step, h, w);
    decompose2D(dst[2], dst[3], row_high, linesize, 1, step, h, w);
}
180
/**
 * One level of the separable 2D reconstruction, the counterpart of
 * decompose2D2().
 *
 * The band pairs are first merged along the columns into temp[0] and
 * temp[1]; those two are then merged along the rows into dst.
 *
 * @param dst      reconstructed output
 * @param src      four input bands, paired as (src[0], src[1]) and
 *                 (src[2], src[3])
 * @param temp     two scratch buffers for the column pass
 * @param linesize stride of all buffers, in floats
 * @param step     sample spacing for this level
 * @param w        width in samples
 * @param h        height in samples
 */
static void compose2D2(float *dst, float *src[4], float *temp[2],
                       int linesize, int step, int w, int h)
{
    float *const row_low  = temp[0];
    float *const row_high = temp[1];

    /* vertical passes: strides and dimensions are swapped */
    compose2D(row_low,  src[0], src[1], linesize, 1, step, h, w);
    compose2D(row_high, src[2], src[3], linesize, 1, step, h, w);

    /* horizontal pass: unit sample stride, one line per image row */
    compose2D(dst, row_low, row_high, 1, linesize, step, w, h);
}
188
189 6 static void filter(OWDenoiseContext *s,
190 uint8_t *dst, int dst_linesize,
191 const uint8_t *src, int src_linesize,
192 int width, int height, double strength)
193 {
194 6 int x, y, i, j, depth = s->depth;
195
196
4/4
✓ Branch 0 taken 16 times.
✓ Branch 1 taken 12 times.
✓ Branch 2 taken 6 times.
✓ Branch 3 taken 6 times.
28 while (1<<depth > width || 1<<depth > height)
197 22 depth--;
198
199
1/2
✓ Branch 0 taken 6 times.
✗ Branch 1 not taken.
6 if (s->pixel_depth <= 8) {
200
2/2
✓ Branch 0 taken 960 times.
✓ Branch 1 taken 6 times.
966 for (y = 0; y < height; y++)
201
2/2
✓ Branch 0 taken 230400 times.
✓ Branch 1 taken 960 times.
231360 for(x = 0; x < width; x++)
202 230400 s->plane[0][0][y*s->linesize + x] = src[y*src_linesize + x];
203 } else {
204 const uint16_t *src16 = (const uint16_t *)src;
205
206 src_linesize /= 2;
207 for (y = 0; y < height; y++)
208 for(x = 0; x < width; x++)
209 s->plane[0][0][y*s->linesize + x] = src16[y*src_linesize + x];
210 }
211
212
2/2
✓ Branch 0 taken 38 times.
✓ Branch 1 taken 6 times.
44 for (i = 0; i < depth; i++)
213 38 decompose2D2(s->plane[i + 1], s->plane[i][0], s->plane[0] + 1, s->linesize, 1<<i, width, height);
214
215
2/2
✓ Branch 0 taken 38 times.
✓ Branch 1 taken 6 times.
44 for (i = 0; i < depth; i++) {
216
2/2
✓ Branch 0 taken 114 times.
✓ Branch 1 taken 38 times.
152 for (j = 1; j < 4; j++) {
217
2/2
✓ Branch 0 taken 18720 times.
✓ Branch 1 taken 114 times.
18834 for (y = 0; y < height; y++) {
218
2/2
✓ Branch 0 taken 4608000 times.
✓ Branch 1 taken 18720 times.
4626720 for (x = 0; x < width; x++) {
219 4608000 double v = s->plane[i + 1][j][y*s->linesize + x];
220
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4608000 times.
4608000 if (v > strength) v -= strength;
221
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4608000 times.
4608000 else if (v < -strength) v += strength;
222 4608000 else v = 0;
223 4608000 s->plane[i + 1][j][x + y*s->linesize] = v;
224 }
225 }
226 }
227 }
228
2/2
✓ Branch 0 taken 38 times.
✓ Branch 1 taken 6 times.
44 for (i = depth-1; i >= 0; i--)
229 38 compose2D2(s->plane[i][0], s->plane[i + 1], s->plane[0] + 1, s->linesize, 1<<i, width, height);
230
231
1/2
✓ Branch 0 taken 6 times.
✗ Branch 1 not taken.
6 if (s->pixel_depth <= 8) {
232
2/2
✓ Branch 0 taken 960 times.
✓ Branch 1 taken 6 times.
966 for (y = 0; y < height; y++) {
233
2/2
✓ Branch 0 taken 230400 times.
✓ Branch 1 taken 960 times.
231360 for (x = 0; x < width; x++) {
234 230400 i = s->plane[0][0][y*s->linesize + x] + dither[x&7][y&7]*(1.0/64) + 1.0/128; // yes the rounding is insane but optimal :)
235
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 230400 times.
230400 if ((unsigned)i > 255U) i = ~(i >> 31);
236 230400 dst[y*dst_linesize + x] = i;
237 }
238 }
239 } else {
240 uint16_t *dst16 = (uint16_t *)dst;
241
242 dst_linesize /= 2;
243 for (y = 0; y < height; y++) {
244 for (x = 0; x < width; x++) {
245 i = s->plane[0][0][y*s->linesize + x];
246 dst16[y*dst_linesize + x] = i;
247 }
248 }
249 }
250 6 }
251
252 2 static int filter_frame(AVFilterLink *inlink, AVFrame *in)
253 {
254 2 AVFilterContext *ctx = inlink->dst;
255 2 OWDenoiseContext *s = ctx->priv;
256 2 AVFilterLink *outlink = ctx->outputs[0];
257 AVFrame *out;
258 2 const int cw = AV_CEIL_RSHIFT(inlink->w, s->hsub);
259 2 const int ch = AV_CEIL_RSHIFT(inlink->h, s->vsub);
260
261
1/2
✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.
2 if (av_frame_is_writable(in)) {
262 2 out = in;
263
264
1/2
✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.
2 if (s->luma_strength > 0)
265 2 filter(s, out->data[0], out->linesize[0], in->data[0], in->linesize[0], inlink->w, inlink->h, s->luma_strength);
266
1/2
✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.
2 if (s->chroma_strength > 0) {
267 2 filter(s, out->data[1], out->linesize[1], in->data[1], in->linesize[1], cw, ch, s->chroma_strength);
268 2 filter(s, out->data[2], out->linesize[2], in->data[2], in->linesize[2], cw, ch, s->chroma_strength);
269 }
270 } else {
271 out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
272 if (!out) {
273 av_frame_free(&in);
274 return AVERROR(ENOMEM);
275 }
276 av_frame_copy_props(out, in);
277
278 if (s->luma_strength > 0) {
279 filter(s, out->data[0], out->linesize[0], in->data[0], in->linesize[0], inlink->w, inlink->h, s->luma_strength);
280 } else {
281 av_image_copy_plane(out->data[0], out->linesize[0], in ->data[0], in ->linesize[0], inlink->w, inlink->h);
282 }
283 if (s->chroma_strength > 0) {
284 filter(s, out->data[1], out->linesize[1], in->data[1], in->linesize[1], cw, ch, s->chroma_strength);
285 filter(s, out->data[2], out->linesize[2], in->data[2], in->linesize[2], cw, ch, s->chroma_strength);
286 } else {
287 av_image_copy_plane(out->data[1], out->linesize[1], in ->data[1], in ->linesize[1], inlink->w, inlink->h);
288 av_image_copy_plane(out->data[2], out->linesize[2], in ->data[2], in ->linesize[2], inlink->w, inlink->h);
289 }
290
291 if (in->data[3])
292 av_image_copy_plane(out->data[3], out->linesize[3],
293 in ->data[3], in ->linesize[3],
294 inlink->w, inlink->h);
295 av_frame_free(&in);
296 }
297
298 2 return ff_filter_frame(outlink, out);
299 }
300
301 static const enum AVPixelFormat pix_fmts[] = {
302 AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUV422P,
303 AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV411P,
304 AV_PIX_FMT_YUV410P, AV_PIX_FMT_YUV440P,
305 AV_PIX_FMT_YUVA444P, AV_PIX_FMT_YUVA422P,
306 AV_PIX_FMT_YUVA420P,
307 AV_PIX_FMT_YUV420P9, AV_PIX_FMT_YUV422P9, AV_PIX_FMT_YUV444P9,
308 AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10,
309 AV_PIX_FMT_YUV440P10,
310 AV_PIX_FMT_YUV444P12, AV_PIX_FMT_YUV422P12, AV_PIX_FMT_YUV420P12,
311 AV_PIX_FMT_YUV440P12,
312 AV_PIX_FMT_YUV444P14, AV_PIX_FMT_YUV422P14, AV_PIX_FMT_YUV420P14,
313 AV_PIX_FMT_YUV420P16, AV_PIX_FMT_YUV422P16, AV_PIX_FMT_YUV444P16,
314 AV_PIX_FMT_NONE
315 };
316
317 1 static int config_input(AVFilterLink *inlink)
318 {
319 int i, j;
320 1 OWDenoiseContext *s = inlink->dst->priv;
321 1 const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
322 1 const int h = FFALIGN(inlink->h, 16);
323
324 1 s->hsub = desc->log2_chroma_w;
325 1 s->vsub = desc->log2_chroma_h;
326 1 s->pixel_depth = desc->comp[0].depth;
327
328 1 s->linesize = FFALIGN(inlink->w, 16);
329
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 1 times.
5 for (j = 0; j < 4; j++) {
330
2/2
✓ Branch 0 taken 44 times.
✓ Branch 1 taken 4 times.
48 for (i = 0; i <= s->depth; i++) {
331 44 s->plane[i][j] = av_malloc_array(s->linesize, h * sizeof(s->plane[0][0][0]));
332
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 44 times.
44 if (!s->plane[i][j])
333 return AVERROR(ENOMEM);
334 }
335 }
336 1 return 0;
337 }
338
339 2 static av_cold void uninit(AVFilterContext *ctx)
340 {
341 int i, j;
342 2 OWDenoiseContext *s = ctx->priv;
343
344
2/2
✓ Branch 0 taken 8 times.
✓ Branch 1 taken 2 times.
10 for (j = 0; j < 4; j++)
345
2/2
✓ Branch 0 taken 88 times.
✓ Branch 1 taken 8 times.
96 for (i = 0; i <= s->depth; i++)
346 88 av_freep(&s->plane[i][j]);
347 2 }
348
349 static const AVFilterPad owdenoise_inputs[] = {
350 {
351 .name = "default",
352 .type = AVMEDIA_TYPE_VIDEO,
353 .filter_frame = filter_frame,
354 .config_props = config_input,
355 },
356 };
357
358 const AVFilter ff_vf_owdenoise = {
359 .name = "owdenoise",
360 .description = NULL_IF_CONFIG_SMALL("Denoise using wavelets."),
361 .priv_size = sizeof(OWDenoiseContext),
362 .uninit = uninit,
363 FILTER_INPUTS(owdenoise_inputs),
364 FILTER_OUTPUTS(ff_video_default_filterpad),
365 FILTER_PIXFMTS_ARRAY(pix_fmts),
366 .priv_class = &owdenoise_class,
367 .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
368 };
369