1 /*
2 * Copyright (c) 2018 Paul B Mahol
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #include "libavutil/imgutils.h"
22 #include "libavutil/pixdesc.h"
23 #include "libavutil/opt.h"
24 #include "avfilter.h"
25 #include "formats.h"
26 #include "internal.h"
27 #include "video.h"
28
29 typedef struct MaskFunContext {
30 const AVClass *class;
31
32 int low, high;
33 int planes;
34 int fill;
35 int sum;
36
37 int linesize[4];
38 int width[4], height[4];
39 int nb_planes;
40 int depth;
41 int max;
42 uint64_t max_sum;
43
44 AVFrame *empty;
45 int (*getsum)(AVFilterContext *ctx, AVFrame *out);
46 int (*maskfun)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
47 } MaskFunContext;
48
/* Byte offset of option field x inside the filter's private context. */
#define OFFSET(x) offsetof(MaskFunContext, x)
/*
 * Flags shared by every option of this filter. The replacement list is
 * parenthesized so that VF always expands as a single operand, whatever
 * operators surround it at the point of use.
 */
#define VF (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM)
51
52 static const AVOption maskfun_options[] = {
53 { "low", "set low threshold", OFFSET(low), AV_OPT_TYPE_INT, {.i64=10}, 0, UINT16_MAX, VF },
54 { "high", "set high threshold", OFFSET(high), AV_OPT_TYPE_INT, {.i64=10}, 0, UINT16_MAX, VF },
55 { "planes", "set planes", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=0xF}, 0, 0xF, VF },
56 { "fill", "set fill value", OFFSET(fill), AV_OPT_TYPE_INT, {.i64=0}, 0, UINT16_MAX, VF },
57 { "sum", "set sum value", OFFSET(sum), AV_OPT_TYPE_INT, {.i64=10}, 0, UINT16_MAX, VF },
58 { NULL }
59 };
60
61 AVFILTER_DEFINE_CLASS(maskfun);
62
/**
 * Advertise the pixel formats this filter accepts.
 *
 * All entries are planar formats; the same list is applied to every link
 * of the filter through ff_set_common_formats().
 *
 * @return the result of ff_set_common_formats()
 */
static int query_formats(AVFilterContext *ctx)
{
    static const enum AVPixelFormat supported_pix_fmts[] = {
        /* 8-bit YUV / YUVA / YUVJ */
        AV_PIX_FMT_YUVA444P, AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUV440P,
        AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ440P,
        AV_PIX_FMT_YUVA422P, AV_PIX_FMT_YUV422P,
        AV_PIX_FMT_YUVA420P, AV_PIX_FMT_YUV420P,
        AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ420P,
        AV_PIX_FMT_YUVJ411P, AV_PIX_FMT_YUV411P, AV_PIX_FMT_YUV410P,
        /* YUV, 9 to 16 bits */
        AV_PIX_FMT_YUV420P9,  AV_PIX_FMT_YUV422P9,  AV_PIX_FMT_YUV444P9,
        AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10,
        AV_PIX_FMT_YUV420P12, AV_PIX_FMT_YUV422P12, AV_PIX_FMT_YUV444P12,
        AV_PIX_FMT_YUV440P12,
        AV_PIX_FMT_YUV420P14, AV_PIX_FMT_YUV422P14, AV_PIX_FMT_YUV444P14,
        AV_PIX_FMT_YUV420P16, AV_PIX_FMT_YUV422P16, AV_PIX_FMT_YUV444P16,
        /* YUVA, 9 to 16 bits */
        AV_PIX_FMT_YUVA420P9,  AV_PIX_FMT_YUVA422P9,  AV_PIX_FMT_YUVA444P9,
        AV_PIX_FMT_YUVA420P10, AV_PIX_FMT_YUVA422P10, AV_PIX_FMT_YUVA444P10,
        AV_PIX_FMT_YUVA420P16, AV_PIX_FMT_YUVA422P16, AV_PIX_FMT_YUVA444P16,
        /* planar RGB / RGBA */
        AV_PIX_FMT_GBRP,   AV_PIX_FMT_GBRP9,  AV_PIX_FMT_GBRP10,
        AV_PIX_FMT_GBRP12, AV_PIX_FMT_GBRP14, AV_PIX_FMT_GBRP16,
        AV_PIX_FMT_GBRAP,  AV_PIX_FMT_GBRAP10,
        AV_PIX_FMT_GBRAP12, AV_PIX_FMT_GBRAP16,
        /* grayscale */
        AV_PIX_FMT_GRAY8,  AV_PIX_FMT_GRAY9,  AV_PIX_FMT_GRAY10,
        AV_PIX_FMT_GRAY12, AV_PIX_FMT_GRAY14, AV_PIX_FMT_GRAY16,
        /* terminator */
        AV_PIX_FMT_NONE
    };

    return ff_set_common_formats(ctx, ff_make_format_list(supported_pix_fmts));
}
88
/**
 * Process one input frame.
 *
 * When the depth-specific getsum() worker returns non-zero, the input frame
 * is discarded and a clone of the pre-filled "empty" frame is sent instead,
 * carrying the input frame's pts. Otherwise the thresholding worker runs on
 * the input frame itself, split into slice jobs, and that frame is sent on.
 *
 * @return the result of ff_filter_frame(), or AVERROR(ENOMEM) when the
 *         replacement frame cannot be cloned
 */
static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
{
    AVFilterContext *ctx = inlink->dst;
    AVFilterLink *outlink = ctx->outputs[0];
    MaskFunContext *s = ctx->priv;
    AVFrame *replacement;

    if (!s->getsum(ctx, frame)) {
        /* Job count is capped by the height of plane 1. */
        ctx->internal->execute(ctx, s->maskfun, frame, NULL,
                               FFMIN(s->height[1], ff_filter_get_nb_threads(ctx)));

        return ff_filter_frame(outlink, frame);
    }

    /* Sum limit reached: swap the frame for the constant one. */
    replacement = av_frame_clone(s->empty);
    if (replacement)
        replacement->pts = frame->pts;
    av_frame_free(&frame);

    if (!replacement)
        return AVERROR(ENOMEM);

    return ff_filter_frame(outlink, replacement);
}
113
114 #define GETSUM(name, type, div) \
115 static int getsum##name(AVFilterContext *ctx, AVFrame *out) \
116 { \
117 MaskFunContext *s = ctx->priv; \
118 uint64_t sum = 0; \
119 int p; \
120 \
121 for (p = 0; p < s->nb_planes; p++) { \
122 const int linesize = out->linesize[p] / div; \
123 const int w = s->width[p]; \
124 const int h = s->height[p]; \
125 type *dst = (type *)out->data[p]; \
126 \
127 if (!((1 << p) & s->planes)) \
128 continue; \
129 \
130 for (int y = 0; y < h; y++) { \
131 for (int x = 0; x < w; x++) \
132 sum += dst[x]; \
133 if (sum >= s->max_sum) \
134 return 1; \
135 dst += linesize; \
136 } \
137 } \
138 \
139 return 0; \
140 }
141
142 GETSUM(8, uint8_t, 1)
143 GETSUM(16, uint16_t, 2)
144
145 #define MASKFUN(name, type, div) \
146 static int maskfun##name(AVFilterContext *ctx, void *arg, \
147 int jobnr, int nb_jobs) \
148 { \
149 MaskFunContext *s = ctx->priv; \
150 AVFrame *out = arg; \
151 const int low = s->low; \
152 const int high = s->high; \
153 const int max = s->max; \
154 int p; \
155 \
156 for (p = 0; p < s->nb_planes; p++) { \
157 const int linesize = out->linesize[p] / div; \
158 const int w = s->width[p]; \
159 const int h = s->height[p]; \
160 const int slice_start = (h * jobnr) / nb_jobs; \
161 const int slice_end = (h * (jobnr+1)) / nb_jobs; \
162 type *dst = (type *)out->data[p] + slice_start * linesize; \
163 \
164 if (!((1 << p) & s->planes)) \
165 continue; \
166 \
167 for (int y = slice_start; y < slice_end; y++) { \
168 for (int x = 0; x < w; x++) { \
169 if (dst[x] <= low) \
170 dst[x] = 0; \
171 else if (dst[x] > high) \
172 dst[x] = max; \
173 } \
174 \
175 dst += linesize; \
176 } \
177 } \
178 \
179 return 0; \
180 }
181
182 MASKFUN(8, uint8_t, 1)
183 MASKFUN(16, uint16_t, 2)
184
config_input(AVFilterLink * inlink)185 static int config_input(AVFilterLink *inlink)
186 {
187 AVFilterContext *ctx = inlink->dst;
188 MaskFunContext *s = ctx->priv;
189 const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
190 int vsub, hsub, ret;
191
192 s->nb_planes = av_pix_fmt_count_planes(inlink->format);
193
194 if ((ret = av_image_fill_linesizes(s->linesize, inlink->format, inlink->w)) < 0)
195 return ret;
196
197 hsub = desc->log2_chroma_w;
198 vsub = desc->log2_chroma_h;
199 s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, vsub);
200 s->height[0] = s->height[3] = inlink->h;
201 s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, hsub);
202 s->width[0] = s->width[3] = inlink->w;
203
204 s->depth = desc->comp[0].depth;
205 s->max = (1 << s->depth) - 1;
206 s->fill = FFMIN(s->fill, s->max);
207
208 if (s->depth == 8) {
209 s->maskfun = maskfun8;
210 s->getsum = getsum8;
211 } else {
212 s->maskfun = maskfun16;
213 s->getsum = getsum16;
214 }
215
216 s->empty = ff_get_video_buffer(inlink, inlink->w, inlink->h);
217 if (!s->empty)
218 return AVERROR(ENOMEM);
219
220 if (s->depth == 8) {
221 for (int p = 0; p < s->nb_planes; p++) {
222 uint8_t *dst = s->empty->data[p];
223
224 for (int y = 0; y < s->height[p]; y++) {
225 memset(dst, s->fill, s->width[p]);
226 dst += s->empty->linesize[p];
227 }
228 }
229 } else {
230 for (int p = 0; p < s->nb_planes; p++) {
231 uint16_t *dst = (uint16_t *)s->empty->data[p];
232
233 for (int y = 0; y < s->height[p]; y++) {
234 for (int x = 0; x < s->width[p]; x++)
235 dst[x] = s->fill;
236 dst += s->empty->linesize[p] / 2;
237 }
238 }
239 }
240
241 s->max_sum = 0;
242 for (int p = 0; p < s->nb_planes; p++) {
243 if (!((1 << p) & s->planes))
244 continue;
245 s->max_sum += (uint64_t)s->sum * s->width[p] * s->height[p];
246 }
247
248 return 0;
249 }
250
uninit(AVFilterContext * ctx)251 static av_cold void uninit(AVFilterContext *ctx)
252 {
253 MaskFunContext *s = ctx->priv;
254
255 av_frame_free(&s->empty);
256 }
257
258 static const AVFilterPad maskfun_inputs[] = {
259 {
260 .name = "default",
261 .type = AVMEDIA_TYPE_VIDEO,
262 .filter_frame = filter_frame,
263 .config_props = config_input,
264 .needs_writable = 1,
265 },
266 { NULL }
267 };
268
269 static const AVFilterPad maskfun_outputs[] = {
270 {
271 .name = "default",
272 .type = AVMEDIA_TYPE_VIDEO,
273 },
274 { NULL }
275 };
276
277 AVFilter ff_vf_maskfun = {
278 .name = "maskfun",
279 .description = NULL_IF_CONFIG_SMALL("Create Mask."),
280 .priv_size = sizeof(MaskFunContext),
281 .query_formats = query_formats,
282 .uninit = uninit,
283 .inputs = maskfun_inputs,
284 .outputs = maskfun_outputs,
285 .priv_class = &maskfun_class,
286 .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS,
287 };
288