1 /*
2 * Copyright (c) 2019 Paul B Mahol
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #include "config_components.h"
22
23 #include "libavutil/avstring.h"
24 #include "libavutil/imgutils.h"
25 #include "libavutil/intreadwrite.h"
26 #include "libavutil/opt.h"
27 #include "libavutil/pixdesc.h"
28 #include "libavutil/qsort.h"
29
30 #include "avfilter.h"
31 #include "formats.h"
32 #include "internal.h"
33 #include "framesync.h"
34 #include "video.h"
35
36 typedef struct XMedianContext {
37 const AVClass *class;
38 const AVPixFmtDescriptor *desc;
39 int nb_inputs;
40 int nb_frames;
41 int nb_threads;
42 int planes;
43 float percentile;
44
45 int xmedian;
46 int radius;
47 int index;
48 int depth;
49 int max;
50 int nb_planes;
51 int linesizes[4];
52 int width[4];
53 int height[4];
54
55 uint8_t **data;
56 int *linesize;
57
58 AVFrame **frames;
59 FFFrameSync fs;
60
61 int (*median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
62 } XMedianContext;
63
64 static const enum AVPixelFormat pixel_fmts[] = {
65 AV_PIX_FMT_GRAY8,
66 AV_PIX_FMT_GRAY9,
67 AV_PIX_FMT_GRAY10,
68 AV_PIX_FMT_GRAY12,
69 AV_PIX_FMT_GRAY14,
70 AV_PIX_FMT_GRAY16,
71 AV_PIX_FMT_YUV410P, AV_PIX_FMT_YUV411P,
72 AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P,
73 AV_PIX_FMT_YUV440P, AV_PIX_FMT_YUV444P,
74 AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_YUVJ422P,
75 AV_PIX_FMT_YUVJ440P, AV_PIX_FMT_YUVJ444P,
76 AV_PIX_FMT_YUVJ411P,
77 AV_PIX_FMT_YUV420P9, AV_PIX_FMT_YUV422P9, AV_PIX_FMT_YUV444P9,
78 AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10,
79 AV_PIX_FMT_YUV440P10,
80 AV_PIX_FMT_YUV444P12, AV_PIX_FMT_YUV422P12, AV_PIX_FMT_YUV420P12,
81 AV_PIX_FMT_YUV440P12,
82 AV_PIX_FMT_YUV444P14, AV_PIX_FMT_YUV422P14, AV_PIX_FMT_YUV420P14,
83 AV_PIX_FMT_YUV420P16, AV_PIX_FMT_YUV422P16, AV_PIX_FMT_YUV444P16,
84 AV_PIX_FMT_GBRP, AV_PIX_FMT_GBRP9, AV_PIX_FMT_GBRP10,
85 AV_PIX_FMT_GBRP12, AV_PIX_FMT_GBRP14, AV_PIX_FMT_GBRP16,
86 AV_PIX_FMT_YUVA420P, AV_PIX_FMT_YUVA422P, AV_PIX_FMT_YUVA444P,
87 AV_PIX_FMT_YUVA444P9, AV_PIX_FMT_YUVA444P10, AV_PIX_FMT_YUVA444P12, AV_PIX_FMT_YUVA444P16,
88 AV_PIX_FMT_YUVA422P9, AV_PIX_FMT_YUVA422P10, AV_PIX_FMT_YUVA422P12, AV_PIX_FMT_YUVA422P16,
89 AV_PIX_FMT_YUVA420P9, AV_PIX_FMT_YUVA420P10, AV_PIX_FMT_YUVA420P16,
90 AV_PIX_FMT_GBRAP, AV_PIX_FMT_GBRAP10, AV_PIX_FMT_GBRAP12, AV_PIX_FMT_GBRAP16,
91 AV_PIX_FMT_NONE
92 };
93
init(AVFilterContext * ctx)94 static av_cold int init(AVFilterContext *ctx)
95 {
96 XMedianContext *s = ctx->priv;
97
98 if (!s->xmedian)
99 s->nb_inputs = s->radius * 2 + 1;
100
101 if (s->nb_inputs & 1)
102 s->index = s->radius * 2.f * s->percentile;
103 else
104 s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
105 s->frames = av_calloc(s->nb_inputs, sizeof(*s->frames));
106 if (!s->frames)
107 return AVERROR(ENOMEM);
108
109 return 0;
110 }
111
112 typedef struct ThreadData {
113 AVFrame **in, *out;
114 } ThreadData;
115
compare8(const void * p1,const void * p2)116 static int compare8(const void *p1, const void *p2)
117 {
118 int left = *(const uint8_t *)p1;
119 int right = *(const uint8_t *)p2;
120 return FFDIFFSIGN(left, right);
121 }
122
compare16(const void * p1,const void * p2)123 static int compare16(const void *p1, const void *p2)
124 {
125 int left = *(const uint16_t *)p1;
126 int right = *(const uint16_t *)p2;
127 return FFDIFFSIGN(left, right);
128 }
129
130 #define MEDIAN_SLICE(name, type, comparei) \
131 static int median_frames ## name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
132 { \
133 XMedianContext *s = ctx->priv; \
134 ThreadData *td = arg; \
135 AVFrame **in = td->in; \
136 AVFrame *out = td->out; \
137 const int nb_inputs = s->nb_inputs; \
138 uint8_t **srcf = s->data + jobnr * nb_inputs; \
139 int *linesize = s->linesize + jobnr * nb_inputs; \
140 const int radius = s->radius; \
141 const int index = s->index; \
142 type values[256]; \
143 \
144 for (int p = 0; p < s->nb_planes; p++) { \
145 const int slice_start = (s->height[p] * jobnr) / nb_jobs; \
146 const int slice_end = (s->height[p] * (jobnr+1)) / nb_jobs; \
147 const int width = s->width[p]; \
148 type *dst = (type *)(out->data[p] + slice_start * out->linesize[p]); \
149 ptrdiff_t dst_linesize = out->linesize[p] / sizeof(type); \
150 \
151 if (!((1 << p) & s->planes)) { \
152 av_image_copy_plane((uint8_t *)dst, out->linesize[p], \
153 in[radius]->data[p] + slice_start * in[radius]->linesize[p], \
154 in[radius]->linesize[p], \
155 s->linesizes[p], slice_end - slice_start); \
156 continue; \
157 } \
158 \
159 for (int i = 0; i < nb_inputs; i++) \
160 linesize[i] = in[i]->linesize[p]; \
161 \
162 for (int i = 0; i < nb_inputs; i++) \
163 srcf[i] = in[i]->data[p] + slice_start * linesize[i]; \
164 \
165 for (int y = slice_start; y < slice_end; y++) { \
166 for (int x = 0; x < width; x++) { \
167 for (int i = 0; i < nb_inputs; i++) { \
168 const type *src = (const type *)srcf[i]; \
169 values[i] = src[x]; \
170 } \
171 \
172 AV_QSORT(values, nb_inputs, type, comparei); \
173 if (nb_inputs & 1) \
174 dst[x] = values[index]; \
175 else \
176 dst[x] = (values[index] + values[index - 1]) >> 1; \
177 } \
178 \
179 dst += dst_linesize; \
180 for (int i = 0; i < nb_inputs; i++) \
181 srcf[i] += linesize[i]; \
182 } \
183 } \
184 \
185 return 0; \
186 }
187
188 MEDIAN_SLICE(8, uint8_t, compare8)
189 MEDIAN_SLICE(16, uint16_t, compare16)
190
update_index(XMedianContext * s)191 static void update_index(XMedianContext *s)
192 {
193 if (s->nb_inputs & 1)
194 s->index = s->radius * 2.f * s->percentile;
195 else
196 s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
197 }
198
process_frame(FFFrameSync * fs)199 static int process_frame(FFFrameSync *fs)
200 {
201 AVFilterContext *ctx = fs->parent;
202 AVFilterLink *outlink = ctx->outputs[0];
203 XMedianContext *s = fs->opaque;
204 AVFrame **in = s->frames;
205 AVFrame *out;
206 ThreadData td;
207 int i, ret;
208
209 update_index(s);
210
211 for (i = 0; i < s->nb_inputs; i++) {
212 if ((ret = ff_framesync_get_frame(&s->fs, i, &in[i], 0)) < 0)
213 return ret;
214 }
215
216 if (ctx->is_disabled) {
217 out = av_frame_clone(in[0]);
218 } else {
219 out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
220 }
221 if (!out)
222 return AVERROR(ENOMEM);
223 out->pts = av_rescale_q(s->fs.pts, s->fs.time_base, outlink->time_base);
224
225 if (!ctx->is_disabled) {
226 td.in = in;
227 td.out = out;
228 ff_filter_execute(ctx, s->median_frames, &td, NULL,
229 FFMIN(s->height[1], s->nb_threads));
230 }
231
232 return ff_filter_frame(outlink, out);
233 }
234
config_output(AVFilterLink * outlink)235 static int config_output(AVFilterLink *outlink)
236 {
237 AVFilterContext *ctx = outlink->src;
238 XMedianContext *s = ctx->priv;
239 AVRational frame_rate = ctx->inputs[0]->frame_rate;
240 AVRational sar = ctx->inputs[0]->sample_aspect_ratio;
241 AVFilterLink *inlink = ctx->inputs[0];
242 int height = ctx->inputs[0]->h;
243 int width = ctx->inputs[0]->w;
244 FFFrameSyncIn *in;
245 int i, ret;
246
247 for (int i = 1; i < s->nb_inputs && s->xmedian; i++) {
248 if (ctx->inputs[i]->h != height || ctx->inputs[i]->w != width) {
249 av_log(ctx, AV_LOG_ERROR, "Input %d size (%dx%d) does not match input %d size (%dx%d).\n", i, ctx->inputs[i]->w, ctx->inputs[i]->h, 0, width, height);
250 return AVERROR(EINVAL);
251 }
252 }
253
254 s->desc = av_pix_fmt_desc_get(outlink->format);
255 if (!s->desc)
256 return AVERROR_BUG;
257 s->nb_planes = av_pix_fmt_count_planes(outlink->format);
258 s->depth = s->desc->comp[0].depth;
259 s->max = (1 << s->depth) - 1;
260 s->nb_threads = ff_filter_get_nb_threads(ctx);
261
262 if (s->depth <= 8)
263 s->median_frames = median_frames8;
264 else
265 s->median_frames = median_frames16;
266
267 if ((ret = av_image_fill_linesizes(s->linesizes, inlink->format, inlink->w)) < 0)
268 return ret;
269
270 s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, s->desc->log2_chroma_w);
271 s->width[0] = s->width[3] = inlink->w;
272 s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, s->desc->log2_chroma_h);
273 s->height[0] = s->height[3] = inlink->h;
274
275 s->data = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->data));
276 if (!s->data)
277 return AVERROR(ENOMEM);
278
279 s->linesize = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->linesize));
280 if (!s->linesize)
281 return AVERROR(ENOMEM);
282
283 if (!s->xmedian)
284 return 0;
285
286 outlink->w = width;
287 outlink->h = height;
288 outlink->frame_rate = frame_rate;
289 outlink->sample_aspect_ratio = sar;
290
291 if ((ret = ff_framesync_init(&s->fs, ctx, s->nb_inputs)) < 0)
292 return ret;
293
294 in = s->fs.in;
295 s->fs.opaque = s;
296 s->fs.on_event = process_frame;
297
298 for (i = 0; i < s->nb_inputs; i++) {
299 AVFilterLink *inlink = ctx->inputs[i];
300
301 in[i].time_base = inlink->time_base;
302 in[i].sync = 1;
303 in[i].before = EXT_STOP;
304 in[i].after = EXT_INFINITY;
305 }
306
307 ret = ff_framesync_configure(&s->fs);
308 outlink->time_base = s->fs.time_base;
309
310 return ret;
311 }
312
uninit(AVFilterContext * ctx)313 static av_cold void uninit(AVFilterContext *ctx)
314 {
315 XMedianContext *s = ctx->priv;
316
317 ff_framesync_uninit(&s->fs);
318
319 for (int i = 0; i < s->nb_frames && s->frames && !s->xmedian; i++)
320 av_frame_free(&s->frames[i]);
321 av_freep(&s->frames);
322 av_freep(&s->data);
323 av_freep(&s->linesize);
324 }
325
activate(AVFilterContext * ctx)326 static int activate(AVFilterContext *ctx)
327 {
328 XMedianContext *s = ctx->priv;
329 return ff_framesync_activate(&s->fs);
330 }
331
332 #if CONFIG_XMEDIAN_FILTER
xmedian_init(AVFilterContext * ctx)333 static av_cold int xmedian_init(AVFilterContext *ctx)
334 {
335 XMedianContext *s = ctx->priv;
336 int ret;
337
338 s->xmedian = 1;
339
340 s->radius = s->nb_inputs / 2;
341
342 for (int i = 0; i < s->nb_inputs; i++) {
343 AVFilterPad pad = { 0 };
344
345 pad.type = AVMEDIA_TYPE_VIDEO;
346 pad.name = av_asprintf("input%d", i);
347 if (!pad.name)
348 return AVERROR(ENOMEM);
349
350 if ((ret = ff_append_inpad_free_name(ctx, &pad)) < 0)
351 return ret;
352 }
353
354 return init(ctx);
355 }
356
357 #define OFFSET(x) offsetof(XMedianContext, x)
358 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM
359 #define TFLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_RUNTIME_PARAM
360
361 static const AVOption xmedian_options[] = {
362 { "inputs", "set number of inputs", OFFSET(nb_inputs), AV_OPT_TYPE_INT, {.i64=3}, 3, 255, .flags = FLAGS },
363 { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
364 { "percentile", "set percentile", OFFSET(percentile),AV_OPT_TYPE_FLOAT,{.dbl=0.5}, 0, 1, .flags =TFLAGS },
365 { NULL },
366 };
367
368 static const AVFilterPad outputs[] = {
369 {
370 .name = "default",
371 .type = AVMEDIA_TYPE_VIDEO,
372 .config_props = config_output,
373 },
374 };
375
376 FRAMESYNC_DEFINE_CLASS(xmedian, XMedianContext, fs);
377
378 const AVFilter ff_vf_xmedian = {
379 .name = "xmedian",
380 .description = NULL_IF_CONFIG_SMALL("Pick median pixels from several video inputs."),
381 .priv_size = sizeof(XMedianContext),
382 .priv_class = &xmedian_class,
383 FILTER_OUTPUTS(outputs),
384 FILTER_PIXFMTS_ARRAY(pixel_fmts),
385 .preinit = xmedian_framesync_preinit,
386 .init = xmedian_init,
387 .uninit = uninit,
388 .activate = activate,
389 .flags = AVFILTER_FLAG_DYNAMIC_INPUTS | AVFILTER_FLAG_SLICE_THREADS |
390 AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
391 .process_command = ff_filter_process_command,
392 };
393
394 #endif /* CONFIG_XMEDIAN_FILTER */
395
396 #if CONFIG_TMEDIAN_FILTER
tmedian_filter_frame(AVFilterLink * inlink,AVFrame * in)397 static int tmedian_filter_frame(AVFilterLink *inlink, AVFrame *in)
398 {
399 AVFilterContext *ctx = inlink->dst;
400 AVFilterLink *outlink = ctx->outputs[0];
401 XMedianContext *s = ctx->priv;
402 ThreadData td;
403 AVFrame *out;
404
405 update_index(s);
406
407 if (s->nb_frames < s->nb_inputs) {
408 s->frames[s->nb_frames] = in;
409 s->nb_frames++;
410 if (s->nb_frames < s->nb_inputs)
411 return 0;
412 } else {
413 av_frame_free(&s->frames[0]);
414 memmove(&s->frames[0], &s->frames[1], sizeof(*s->frames) * (s->nb_inputs - 1));
415 s->frames[s->nb_inputs - 1] = in;
416 }
417
418 if (ctx->is_disabled) {
419 out = av_frame_clone(s->frames[0]);
420 if (!out)
421 return AVERROR(ENOMEM);
422 return ff_filter_frame(outlink, out);
423 }
424
425 out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
426 if (!out)
427 return AVERROR(ENOMEM);
428 out->pts = s->frames[0]->pts;
429
430 td.out = out;
431 td.in = s->frames;
432 ff_filter_execute(ctx, s->median_frames, &td, NULL,
433 FFMIN(s->height[1], s->nb_threads));
434
435 return ff_filter_frame(outlink, out);
436 }
437
438 static const AVOption tmedian_options[] = {
439 { "radius", "set median filter radius", OFFSET(radius), AV_OPT_TYPE_INT, {.i64=1}, 1, 127, .flags = FLAGS },
440 { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
441 { "percentile", "set percentile", OFFSET(percentile), AV_OPT_TYPE_FLOAT, {.dbl=0.5}, 0, 1, .flags =TFLAGS },
442 { NULL },
443 };
444
445 static const AVFilterPad tmedian_inputs[] = {
446 {
447 .name = "default",
448 .type = AVMEDIA_TYPE_VIDEO,
449 .filter_frame = tmedian_filter_frame,
450 },
451 };
452
453 static const AVFilterPad tmedian_outputs[] = {
454 {
455 .name = "default",
456 .type = AVMEDIA_TYPE_VIDEO,
457 .config_props = config_output,
458 },
459 };
460
461 AVFILTER_DEFINE_CLASS(tmedian);
462
463 const AVFilter ff_vf_tmedian = {
464 .name = "tmedian",
465 .description = NULL_IF_CONFIG_SMALL("Pick median pixels from successive frames."),
466 .priv_size = sizeof(XMedianContext),
467 .priv_class = &tmedian_class,
468 FILTER_INPUTS(tmedian_inputs),
469 FILTER_OUTPUTS(tmedian_outputs),
470 FILTER_PIXFMTS_ARRAY(pixel_fmts),
471 .init = init,
472 .uninit = uninit,
473 .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL | AVFILTER_FLAG_SLICE_THREADS,
474 .process_command = ff_filter_process_command,
475 };
476
477 #endif /* CONFIG_TMEDIAN_FILTER */
478