| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * Copyright (c) 2021 Paul Buxton | ||
| 3 | * | ||
| 4 | * This file is part of FFmpeg. | ||
| 5 | * | ||
| 6 | * FFmpeg is free software; you can redistribute it and/or | ||
| 7 | * modify it under the terms of the GNU Lesser General Public | ||
| 8 | * License as published by the Free Software Foundation; either | ||
| 9 | * version 2.1 of the License, or (at your option) any later version. | ||
| 10 | * | ||
| 11 | * FFmpeg is distributed in the hope that it will be useful, | ||
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| 14 | * Lesser General Public License for more details. | ||
| 15 | * | ||
| 16 | * You should have received a copy of the GNU Lesser General Public | ||
| 17 | * License along with FFmpeg; if not, write to the Free Software | ||
| 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 19 | */ | ||
| 20 | |||
| 21 | /** | ||
| 22 | * @file | ||
| 23 | * Color correction filter based on | ||
| 24 | * https://www.researchgate.net/publication/275213614_A_New_Color_Correction_Method_for_Underwater_Imaging | ||
| 25 | * | ||
| 26 | */ | ||
| 27 | |||
| 28 | #include "libavutil/imgutils.h" | ||
| 29 | #include "libavutil/mem.h" | ||
| 30 | |||
| 31 | #include "avfilter.h" | ||
| 32 | #include "filters.h" | ||
| 33 | #include "video.h" | ||
| 34 | |||
| 35 | typedef struct ThreadData { | ||
| 36 | AVFrame *in, *out; | ||
| 37 | float l_avg; | ||
| 38 | float a_avg; | ||
| 39 | float b_avg; | ||
| 40 | } ThreadData; | ||
| 41 | |||
| 42 | typedef struct GrayWorldContext { | ||
| 43 | float *tmpplab; | ||
| 44 | int *line_count_pels; | ||
| 45 | float *line_sum; | ||
| 46 | } GrayWorldContext; | ||
| 47 | |||
| 48 | ✗ | static void apply_matrix(const float matrix[3][3], const float input[3], float output[3]) | |
| 49 | { | ||
| 50 | ✗ | output[0] = matrix[0][0] * input[0] + matrix[0][1] * input[1] + matrix[0][2] * input[2]; | |
| 51 | ✗ | output[1] = matrix[1][0] * input[0] + matrix[1][1] * input[1] + matrix[1][2] * input[2]; | |
| 52 | ✗ | output[2] = matrix[2][0] * input[0] + matrix[2][1] * input[1] + matrix[2][2] * input[2]; | |
| 53 | ✗ | } | |
| 54 | |||
| 55 | static const float lms2lab[3][3] = { | ||
| 56 | {0.5774, 0.5774, 0.5774}, | ||
| 57 | {0.40825, 0.40825, -0.816458}, | ||
| 58 | {0.707, -0.707, 0} | ||
| 59 | }; | ||
| 60 | |||
| 61 | static const float lab2lms[3][3] = { | ||
| 62 | {0.57735, 0.40825, 0.707}, | ||
| 63 | {0.57735, 0.40825, -0.707}, | ||
| 64 | {0.57735, -0.8165, 0} | ||
| 65 | }; | ||
| 66 | |||
| 67 | static const float rgb2lms[3][3] = { | ||
| 68 | {0.3811, 0.5783, 0.0402}, | ||
| 69 | {0.1967, 0.7244, 0.0782}, | ||
| 70 | {0.0241, 0.1288, 0.8444} | ||
| 71 | }; | ||
| 72 | |||
| 73 | static const float lms2rgb[3][3] = { | ||
| 74 | {4.4679, -3.5873, 0.1193}, | ||
| 75 | {-1.2186, 2.3809, -0.1624}, | ||
| 76 | {0.0497, -0.2439, 1.2045} | ||
| 77 | }; | ||
| 78 | |||
| 79 | /** | ||
| 80 | * Convert from Linear RGB to logspace LAB | ||
| 81 | * | ||
| 82 | * @param rgb Input array of rgb components | ||
| 83 | * @param lab output array of lab components | ||
| 84 | */ | ||
| 85 | ✗ | static void rgb2lab(const float rgb[3], float lab[3]) | |
| 86 | { | ||
| 87 | float lms[3]; | ||
| 88 | |||
| 89 | ✗ | apply_matrix(rgb2lms, rgb, lms); | |
| 90 | ✗ | lms[0] = lms[0] > 0.f ? logf(lms[0]) : -1024.f; | |
| 91 | ✗ | lms[1] = lms[1] > 0.f ? logf(lms[1]) : -1024.f; | |
| 92 | ✗ | lms[2] = lms[2] > 0.f ? logf(lms[2]) : -1024.f; | |
| 93 | ✗ | apply_matrix(lms2lab, lms, lab); | |
| 94 | ✗ | } | |
| 95 | |||
| 96 | /** | ||
| 97 | * Convert from Logspace LAB to Linear RGB | ||
| 98 | * | ||
| 99 | * @param lab input array of lab components | ||
| 100 | * @param rgb output array of rgb components | ||
| 101 | */ | ||
| 102 | ✗ | static void lab2rgb(const float lab[3], float rgb[3]) | |
| 103 | { | ||
| 104 | float lms[3]; | ||
| 105 | |||
| 106 | ✗ | apply_matrix(lab2lms, lab, lms); | |
| 107 | ✗ | lms[0] = expf(lms[0]); | |
| 108 | ✗ | lms[1] = expf(lms[1]); | |
| 109 | ✗ | lms[2] = expf(lms[2]); | |
| 110 | ✗ | apply_matrix(lms2rgb, lms, rgb); | |
| 111 | ✗ | } | |
| 112 | |||
| 113 | /** | ||
| 114 | * Convert a frame from linear RGB to logspace LAB, and accumulate channel totals for each row | ||
| 115 | * Convert from RGB -> lms using equation 4 in color transfer paper. | ||
| 116 | * | ||
| 117 | * @param ctx Filter context | ||
| 118 | * @param arg Thread data pointer | ||
| 119 | * @param jobnr job number | ||
| 120 | * @param nb_jobs number of jobs | ||
| 121 | */ | ||
| 122 | ✗ | static int convert_frame(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) | |
| 123 | { | ||
| 124 | ✗ | GrayWorldContext *s = ctx->priv; | |
| 125 | ✗ | ThreadData *td = arg; | |
| 126 | ✗ | AVFrame *in = td->in; | |
| 127 | ✗ | AVFrame *out = td->out; | |
| 128 | ✗ | AVFilterLink *outlink = ctx->outputs[0]; | |
| 129 | ✗ | const int slice_start = (out->height * jobnr) / nb_jobs; | |
| 130 | ✗ | const int slice_end = (out->height * (jobnr + 1)) / nb_jobs; | |
| 131 | float rgb[3], lab[3]; | ||
| 132 | |||
| 133 | ✗ | for (int i = slice_start; i < slice_end; i++) { | |
| 134 | ✗ | float *b_in_row = (float *)(in->data[1] + i * in->linesize[1]); | |
| 135 | ✗ | float *g_in_row = (float *)(in->data[0] + i * in->linesize[0]); | |
| 136 | ✗ | float *r_in_row = (float *)(in->data[2] + i * in->linesize[2]); | |
| 137 | ✗ | float *acur = s->tmpplab + i * outlink->w + outlink->w * outlink->h; | |
| 138 | ✗ | float *bcur = s->tmpplab + i * outlink->w + 2 * outlink->w * outlink->h; | |
| 139 | ✗ | float *lcur = s->tmpplab + i * outlink->w; | |
| 140 | |||
| 141 | ✗ | s->line_sum[i] = 0.f; | |
| 142 | ✗ | s->line_sum[i + outlink->h] = 0.f; | |
| 143 | ✗ | s->line_count_pels[i] = 0; | |
| 144 | |||
| 145 | ✗ | for (int j = 0; j < outlink->w; j++) { | |
| 146 | ✗ | rgb[0] = r_in_row[j]; | |
| 147 | ✗ | rgb[1] = g_in_row[j]; | |
| 148 | ✗ | rgb[2] = b_in_row[j]; | |
| 149 | ✗ | rgb2lab(rgb, lab); | |
| 150 | ✗ | *(lcur++) = lab[0]; | |
| 151 | ✗ | *(acur++) = lab[1]; | |
| 152 | ✗ | *(bcur++) = lab[2]; | |
| 153 | ✗ | s->line_sum[i] += lab[1]; | |
| 154 | ✗ | s->line_sum[i + outlink->h] += lab[2]; | |
| 155 | ✗ | s->line_count_pels[i]++; | |
| 156 | } | ||
| 157 | } | ||
| 158 | ✗ | return 0; | |
| 159 | } | ||
| 160 | |||
| 161 | /** | ||
| 162 | * Sum the channel totals and compute the mean for each channel | ||
| 163 | * | ||
| 164 | * @param s Frame context | ||
| 165 | * @param td thread data | ||
| 166 | */ | ||
| 167 | ✗ | static void compute_correction(GrayWorldContext *s, ThreadData *td) | |
| 168 | { | ||
| 169 | ✗ | float asum = 0.f, bsum = 0.f; | |
| 170 | ✗ | int pixels = 0; | |
| 171 | |||
| 172 | ✗ | for (int y = 0; y < td->out->height; y++) { | |
| 173 | ✗ | asum += s->line_sum[y]; | |
| 174 | ✗ | bsum += s->line_sum[y + td->out->height]; | |
| 175 | ✗ | pixels += s->line_count_pels[y]; | |
| 176 | } | ||
| 177 | |||
| 178 | ✗ | td->a_avg = asum / pixels; | |
| 179 | ✗ | td->b_avg = bsum / pixels; | |
| 180 | ✗ | } | |
| 181 | |||
| 182 | /** | ||
| 183 | * Subtract the mean logspace AB values from each pixel. | ||
| 184 | * | ||
| 185 | * @param ctx Filter context | ||
| 186 | * @param arg Thread data pointer | ||
| 187 | * @param jobnr job number | ||
| 188 | * @param nb_jobs number of jobs | ||
| 189 | */ | ||
| 190 | ✗ | static int correct_frame(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) | |
| 191 | { | ||
| 192 | ✗ | GrayWorldContext *s = ctx->priv; | |
| 193 | ✗ | ThreadData *td = arg; | |
| 194 | ✗ | AVFrame *out = td->out; | |
| 195 | ✗ | AVFilterLink *outlink = ctx->outputs[0]; | |
| 196 | ✗ | const int slice_start = (out->height * jobnr) / nb_jobs; | |
| 197 | ✗ | const int slice_end = (out->height * (jobnr + 1)) / nb_jobs; | |
| 198 | float rgb[3], lab[3]; | ||
| 199 | |||
| 200 | ✗ | for (int i = slice_start; i < slice_end; i++) { | |
| 201 | ✗ | float *g_out_row = (float *)(out->data[0] + i * out->linesize[0]); | |
| 202 | ✗ | float *b_out_row = (float *)(out->data[1] + i * out->linesize[1]); | |
| 203 | ✗ | float *r_out_row = (float *)(out->data[2] + i * out->linesize[2]); | |
| 204 | ✗ | float *lcur = s->tmpplab + i * outlink->w; | |
| 205 | ✗ | float *acur = s->tmpplab + i * outlink->w + outlink->w * outlink->h; | |
| 206 | ✗ | float *bcur = s->tmpplab + i * outlink->w + 2 * outlink->w * outlink->h; | |
| 207 | |||
| 208 | ✗ | for (int j = 0; j < outlink->w; j++) { | |
| 209 | ✗ | lab[0] = *lcur++; | |
| 210 | ✗ | lab[1] = *acur++; | |
| 211 | ✗ | lab[2] = *bcur++; | |
| 212 | |||
| 213 | // subtract the average for the color channels | ||
| 214 | ✗ | lab[1] -= td->a_avg; | |
| 215 | ✗ | lab[2] -= td->b_avg; | |
| 216 | |||
| 217 | //convert back to linear rgb | ||
| 218 | ✗ | lab2rgb(lab, rgb); | |
| 219 | ✗ | r_out_row[j] = rgb[0]; | |
| 220 | ✗ | g_out_row[j] = rgb[1]; | |
| 221 | ✗ | b_out_row[j] = rgb[2]; | |
| 222 | } | ||
| 223 | } | ||
| 224 | ✗ | return 0; | |
| 225 | } | ||
| 226 | |||
| 227 | ✗ | static int config_input(AVFilterLink *inlink) | |
| 228 | { | ||
| 229 | ✗ | GrayWorldContext *s = inlink->dst->priv; | |
| 230 | |||
| 231 | ✗ | FF_ALLOC_TYPED_ARRAY(s->tmpplab, inlink->h * inlink->w * 3); | |
| 232 | ✗ | FF_ALLOC_TYPED_ARRAY(s->line_count_pels, inlink->h); | |
| 233 | ✗ | FF_ALLOC_TYPED_ARRAY(s->line_sum, inlink->h * 2); | |
| 234 | ✗ | if (!s->tmpplab || !s->line_count_pels || !s->line_sum) | |
| 235 | ✗ | return AVERROR(ENOMEM); | |
| 236 | |||
| 237 | ✗ | return 0; | |
| 238 | } | ||
| 239 | |||
| 240 | ✗ | static av_cold void uninit(AVFilterContext *ctx) | |
| 241 | { | ||
| 242 | ✗ | GrayWorldContext *s = ctx->priv; | |
| 243 | |||
| 244 | ✗ | av_freep(&s->tmpplab); | |
| 245 | ✗ | av_freep(&s->line_count_pels); | |
| 246 | ✗ | av_freep(&s->line_sum); | |
| 247 | ✗ | } | |
| 248 | |||
| 249 | ✗ | static int filter_frame(AVFilterLink *inlink, AVFrame *in) | |
| 250 | { | ||
| 251 | ✗ | AVFilterContext *ctx = inlink->dst; | |
| 252 | ✗ | GrayWorldContext *s = ctx->priv; | |
| 253 | ✗ | AVFilterLink *outlink = ctx->outputs[0]; | |
| 254 | ThreadData td; | ||
| 255 | AVFrame *out; | ||
| 256 | |||
| 257 | ✗ | if (av_frame_is_writable(in)) { | |
| 258 | ✗ | out = in; | |
| 259 | } else { | ||
| 260 | ✗ | out = ff_get_video_buffer(outlink, outlink->w, outlink->h); | |
| 261 | ✗ | if (!out) { | |
| 262 | ✗ | av_frame_free(&in); | |
| 263 | ✗ | return AVERROR(ENOMEM); | |
| 264 | } | ||
| 265 | ✗ | av_frame_copy_props(out, in); | |
| 266 | } | ||
| 267 | /* input and output transfer will be linear */ | ||
| 268 | ✗ | if (in->color_trc == AVCOL_TRC_UNSPECIFIED) { | |
| 269 | ✗ | av_log(ctx, AV_LOG_WARNING, "Untagged transfer, assuming linear light.\n"); | |
| 270 | ✗ | out->color_trc = AVCOL_TRC_LINEAR; | |
| 271 | ✗ | } else if (in->color_trc != AVCOL_TRC_LINEAR) { | |
| 272 | ✗ | av_log(ctx, AV_LOG_WARNING, "Gray world color correction works on linear light only.\n"); | |
| 273 | } | ||
| 274 | |||
| 275 | ✗ | td.in = in; | |
| 276 | ✗ | td.out = out; | |
| 277 | |||
| 278 | ✗ | ff_filter_execute(ctx, convert_frame, &td, NULL, FFMIN(outlink->h, ff_filter_get_nb_threads(ctx))); | |
| 279 | ✗ | compute_correction(s, &td); | |
| 280 | ✗ | ff_filter_execute(ctx, correct_frame, &td, NULL, FFMIN(outlink->h, ff_filter_get_nb_threads(ctx))); | |
| 281 | |||
| 282 | ✗ | if (in != out) { | |
| 283 | ✗ | av_image_copy_plane(out->data[3], out->linesize[3], | |
| 284 | ✗ | in->data[3], in->linesize[3], outlink->w * 4, outlink->h); | |
| 285 | ✗ | av_frame_free(&in); | |
| 286 | } | ||
| 287 | |||
| 288 | ✗ | return ff_filter_frame(outlink, out); | |
| 289 | } | ||
| 290 | |||
| 291 | static const AVFilterPad grayworld_inputs[] = { | ||
| 292 | { | ||
| 293 | .name = "default", | ||
| 294 | .type = AVMEDIA_TYPE_VIDEO, | ||
| 295 | .filter_frame = filter_frame, | ||
| 296 | .config_props = config_input, | ||
| 297 | } | ||
| 298 | }; | ||
| 299 | |||
| 300 | const FFFilter ff_vf_grayworld = { | ||
| 301 | .p.name = "grayworld", | ||
| 302 | .p.description = NULL_IF_CONFIG_SMALL("Adjust white balance using LAB gray world algorithm"), | ||
| 303 | .p.flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS, | ||
| 304 | .priv_size = sizeof(GrayWorldContext), | ||
| 305 | FILTER_INPUTS(grayworld_inputs), | ||
| 306 | FILTER_OUTPUTS(ff_video_default_filterpad), | ||
| 307 | FILTER_PIXFMTS(AV_PIX_FMT_GBRPF32, AV_PIX_FMT_GBRAPF32), | ||
| 308 | .uninit = uninit, | ||
| 309 | }; | ||
| 310 |