1 /*
2 * Copyright (c) 2010 The WebM project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11
12 // VP8 Set Active and ROI Maps
13 // ===========================
14 //
15 // This is an example demonstrating how to control the VP8 encoder's
16 // ROI and Active maps.
17 //
// ROI (Region of Interest) maps are a way for the application to assign
// each macroblock in the image to a region, and then set quantizer and
// filtering parameters on that region.
21 //
22 // Active maps are a way for the application to specify on a
23 // macroblock-by-macroblock basis whether there is any activity in that
24 // macroblock.
25 //
26 //
27 // Configuration
28 // -------------
29 // An ROI map is set on frame 22. If the width of the image in macroblocks
// is evenly divisible by 4, then the output will appear to have distinct
31 // columns, where the quantizer, loopfilter, and static threshold differ
32 // from column to column.
33 //
34 // An active map is set on frame 33. If the width of the image in macroblocks
// is evenly divisible by 4, then the output will appear to have distinct
36 // columns, where one column will have motion and the next will not.
37 //
38 // The active map is cleared on frame 44.
39 //
40 // Observing The Effects
41 // ---------------------
42 // Use the `simple_decoder` example to decode this sample, and observe
43 // the change in the image at frames 22, 33, and 44.
44
45 #include <stdio.h>
46 #include <stdlib.h>
47 #include <string.h>
48
49 #define VPX_CODEC_DISABLE_COMPAT 1
50 #include "vpx/vp8cx.h"
51 #include "vpx/vpx_encoder.h"
52
53 #include "./tools_common.h"
54 #include "./video_writer.h"
55
56 static const char *exec_name;
57
usage_exit()58 void usage_exit() {
59 fprintf(stderr, "Usage: %s <codec> <width> <height> <infile> <outfile>\n",
60 exec_name);
61 exit(EXIT_FAILURE);
62 }
63
// Builds a region-of-interest map and hands it to the encoder through the
// VP8E_SET_ROI_MAP control.
//
// cfg:   encoder configuration; only g_w and g_h are read, to size the map.
// codec: encoder context that receives the map.
//
// The map dimensions are the frame dimensions divided by 16, rounded up.
// Four regions are configured, each with its own quantizer delta, loop
// filter delta and static threshold, and map entries cycle through region
// ids 0..3 in index order.
//
// The process exits if the map cannot be allocated; a control failure is
// reported through die_codec().
static void set_roi_map(const vpx_codec_enc_cfg_t *cfg,
                        vpx_codec_ctx_t *codec) {
  size_t i;
  size_t entry_count;
  vpx_roi_map_t roi = {0};

  roi.rows = (cfg->g_h + 15) / 16;
  roi.cols = (cfg->g_w + 15) / 16;
  // Compute the entry count once, in size_t, so the allocation size and the
  // loop bound cannot disagree.
  entry_count = (size_t)roi.rows * roi.cols;

  roi.delta_q[0] = 0;
  roi.delta_q[1] = -2;
  roi.delta_q[2] = -4;
  roi.delta_q[3] = -6;

  roi.delta_lf[0] = 0;
  roi.delta_lf[1] = 1;
  roi.delta_lf[2] = 2;
  roi.delta_lf[3] = 3;

  roi.static_threshold[0] = 1500;
  roi.static_threshold[1] = 1000;
  roi.static_threshold[2] = 500;
  roi.static_threshold[3] = 0;

  roi.roi_map = malloc(entry_count);
  if (roi.roi_map == NULL) {
    // Without this check the fill loop below would write through NULL.
    fprintf(stderr, "Failed to allocate ROI map\n");
    exit(EXIT_FAILURE);
  }

  for (i = 0; i < entry_count; ++i)
    roi.roi_map[i] = (uint8_t)(i % 4);

  if (vpx_codec_control(codec, VP8E_SET_ROI_MAP, &roi))
    die_codec(codec, "Failed to set ROI map");

  free(roi.roi_map);
}
96
// Builds an active map and hands it to the encoder through the
// VP8E_SET_ACTIVEMAP control.
//
// cfg:   encoder configuration; only g_w and g_h are read, to size the map.
// codec: encoder context that receives the map.
//
// The map dimensions are the frame dimensions divided by 16, rounded up.
// Entries alternate 0, 1, 0, 1, ... in index order.
//
// The process exits if the map cannot be allocated; a control failure is
// reported through die_codec().
static void set_active_map(const vpx_codec_enc_cfg_t *cfg,
                           vpx_codec_ctx_t *codec) {
  size_t i;
  size_t entry_count;
  vpx_active_map_t map = {0};

  map.rows = (cfg->g_h + 15) / 16;
  map.cols = (cfg->g_w + 15) / 16;
  // Compute the entry count once, in size_t, so the allocation size and the
  // loop bound cannot disagree.
  entry_count = (size_t)map.rows * map.cols;

  map.active_map = malloc(entry_count);
  if (map.active_map == NULL) {
    // Without this check the fill loop below would write through NULL.
    fprintf(stderr, "Failed to allocate active map\n");
    exit(EXIT_FAILURE);
  }

  for (i = 0; i < entry_count; ++i)
    map.active_map[i] = (uint8_t)(i % 2);

  if (vpx_codec_control(codec, VP8E_SET_ACTIVEMAP, &map))
    die_codec(codec, "Failed to set active map");

  free(map.active_map);
}
114
// Removes the active map from the encoder by issuing VP8E_SET_ACTIVEMAP with
// a descriptor whose active_map pointer is NULL.
//
// cfg:   encoder configuration; g_w and g_h supply the map dimensions
//        (frame size divided by 16, rounded up).
// codec: encoder context to update.
//
// A control failure is reported through die_codec().
static void unset_active_map(const vpx_codec_enc_cfg_t *cfg,
                             vpx_codec_ctx_t *codec) {
  vpx_active_map_t cleared = {0};
  vpx_codec_err_t status;

  cleared.active_map = NULL;
  cleared.cols = (cfg->g_w + 15) / 16;
  cleared.rows = (cfg->g_h + 15) / 16;

  status = vpx_codec_control(codec, VP8E_SET_ACTIVEMAP, &cleared);
  if (status != VPX_CODEC_OK) {
    die_codec(codec, "Failed to set active map");
  }
}
126
// Submits one image to the encoder and writes every compressed frame packet
// it produces to the output container.
//
// codec:       encoder context.
// img:         image to encode; main() passes NULL for its final call after
//              the input is exhausted.
// frame_index: value passed to vpx_codec_encode() as the presentation
//              timestamp; the duration is fixed at 1.
// writer:      destination for compressed frames.
//
// Prints "K" for each keyframe packet and "." for every other frame packet
// as progress output. Encode and write failures go through die_codec().
static void encode_frame(vpx_codec_ctx_t *codec,
                         vpx_image_t *img,
                         int frame_index,
                         VpxVideoWriter *writer) {
  const vpx_codec_cx_pkt_t *packet;
  vpx_codec_iter_t cursor = NULL;

  if (vpx_codec_encode(codec, img, frame_index, 1, 0, VPX_DL_GOOD_QUALITY) !=
      VPX_CODEC_OK) {
    die_codec(codec, "Failed to encode frame");
  }

  for (packet = vpx_codec_get_cx_data(codec, &cursor); packet != NULL;
       packet = vpx_codec_get_cx_data(codec, &cursor)) {
    int is_key;

    // Only compressed-frame packets are written out; other kinds are skipped.
    if (packet->kind != VPX_CODEC_CX_FRAME_PKT)
      continue;

    is_key = (packet->data.frame.flags & VPX_FRAME_IS_KEY) != 0;

    if (!vpx_video_writer_write_frame(writer,
                                      packet->data.frame.buf,
                                      packet->data.frame.sz,
                                      packet->data.frame.pts)) {
      die_codec(codec, "Failed to write compressed frame");
    }

    fputs(is_key ? "K" : ".", stdout);
    fflush(stdout);
  }
}
153
main(int argc,char ** argv)154 int main(int argc, char **argv) {
155 FILE *infile = NULL;
156 vpx_codec_ctx_t codec = {0};
157 vpx_codec_enc_cfg_t cfg = {0};
158 int frame_count = 0;
159 vpx_image_t raw = {0};
160 vpx_codec_err_t res;
161 VpxVideoInfo info = {0};
162 VpxVideoWriter *writer = NULL;
163 const VpxInterface *encoder = NULL;
164 const int fps = 2; // TODO(dkovalev) add command line argument
165 const double bits_per_pixel_per_frame = 0.067;
166
167 exec_name = argv[0];
168
169 if (argc != 6)
170 die("Invalid number of arguments");
171
172 encoder = get_vpx_encoder_by_name(argv[1]);
173 if (!encoder)
174 die("Unsupported codec.");
175
176 info.codec_fourcc = encoder->fourcc;
177 info.frame_width = strtol(argv[2], NULL, 0);
178 info.frame_height = strtol(argv[3], NULL, 0);
179 info.time_base.numerator = 1;
180 info.time_base.denominator = fps;
181
182 if (info.frame_width <= 0 ||
183 info.frame_height <= 0 ||
184 (info.frame_width % 2) != 0 ||
185 (info.frame_height % 2) != 0) {
186 die("Invalid frame size: %dx%d", info.frame_width, info.frame_height);
187 }
188
189 if (!vpx_img_alloc(&raw, VPX_IMG_FMT_I420, info.frame_width,
190 info.frame_height, 1)) {
191 die("Failed to allocate image.");
192 }
193
194 printf("Using %s\n", vpx_codec_iface_name(encoder->interface()));
195
196 res = vpx_codec_enc_config_default(encoder->interface(), &cfg, 0);
197 if (res)
198 die_codec(&codec, "Failed to get default codec config.");
199
200 cfg.g_w = info.frame_width;
201 cfg.g_h = info.frame_height;
202 cfg.g_timebase.num = info.time_base.numerator;
203 cfg.g_timebase.den = info.time_base.denominator;
204 cfg.rc_target_bitrate = (unsigned int)(bits_per_pixel_per_frame * cfg.g_w *
205 cfg.g_h * fps / 1000);
206 cfg.g_lag_in_frames = 0;
207
208 writer = vpx_video_writer_open(argv[5], kContainerIVF, &info);
209 if (!writer)
210 die("Failed to open %s for writing.", argv[5]);
211
212 if (!(infile = fopen(argv[4], "rb")))
213 die("Failed to open %s for reading.", argv[4]);
214
215 if (vpx_codec_enc_init(&codec, encoder->interface(), &cfg, 0))
216 die_codec(&codec, "Failed to initialize encoder");
217
218 while (vpx_img_read(&raw, infile)) {
219 ++frame_count;
220
221 if (frame_count == 22 && encoder->fourcc == VP8_FOURCC) {
222 set_roi_map(&cfg, &codec);
223 } else if (frame_count == 33) {
224 set_active_map(&cfg, &codec);
225 } else if (frame_count == 44) {
226 unset_active_map(&cfg, &codec);
227 }
228
229 encode_frame(&codec, &raw, frame_count, writer);
230 }
231 encode_frame(&codec, NULL, -1, writer);
232 printf("\n");
233 fclose(infile);
234 printf("Processed %d frames.\n", frame_count);
235
236 vpx_img_free(&raw);
237 if (vpx_codec_destroy(&codec))
238 die_codec(&codec, "Failed to destroy codec.");
239
240 vpx_video_writer_close(writer);
241
242 return EXIT_SUCCESS;
243 }
244