1 /*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12 #include <assert.h>
13 #include <limits.h>
14
15 #include "config/aom_scale_rtcd.h"
16
17 #include "aom_dsp/aom_dsp_common.h"
18 #include "aom_dsp/psnr.h"
19 #include "aom_mem/aom_mem.h"
20 #include "aom_ports/mem.h"
21
22 #include "av1/common/av1_common_int.h"
23 #include "av1/common/av1_loopfilter.h"
24 #include "av1/common/quant_common.h"
25
26 #include "av1/encoder/av1_quantize.h"
27 #include "av1/encoder/encoder.h"
28 #include "av1/encoder/picklpf.h"
29
// Copies one plane of src_bc into dst_bc.
//
// plane picks the copy routine: 0 -> aom_yv12_copy_y(), 1 -> aom_yv12_copy_u(),
// 2 -> aom_yv12_copy_v(). Any other value trips the assert in debug builds and
// copies nothing when asserts are compiled out.
static void yv12_copy_plane(const YV12_BUFFER_CONFIG *src_bc,
                            YV12_BUFFER_CONFIG *dst_bc, int plane) {
  if (plane == 0) {
    aom_yv12_copy_y(src_bc, dst_bc);
  } else if (plane == 1) {
    aom_yv12_copy_u(src_bc, dst_bc);
  } else if (plane == 2) {
    aom_yv12_copy_v(src_bc, dst_bc);
  } else {
    // Out-of-range plane index: flag it in debug builds.
    assert(plane >= 0 && plane <= 2);
  }
}
39
av1_get_max_filter_level(const AV1_COMP * cpi)40 int av1_get_max_filter_level(const AV1_COMP *cpi) {
41 if (is_stat_consumption_stage_twopass(cpi)) {
42 return cpi->ppi->twopass.section_intra_rating > 8 ? MAX_LOOP_FILTER * 3 / 4
43 : MAX_LOOP_FILTER;
44 } else {
45 return MAX_LOOP_FILTER;
46 }
47 }
48
// Applies the loop filter to one plane of the current frame at a trial level
// and reports how far the result is from the source.
//
//   sd            - source frame the filtered plane is compared against.
//   cpi           - encoder instance; cm->lf is updated with the trial level
//                   and left that way on return.
//   filt_level    - candidate filter level.
//   partial_frame - forwarded to av1_loop_filter_frame_mt().
//   plane         - plane index, 0..2 (asserted).
//   dir           - only meaningful for plane 0: 0 updates filter_level[0]
//                   only, 1 updates filter_level[1] only, any other value
//                   updates both.
//
// Returns the value of aom_get_sse_plane() for the filtered plane. Before
// returning, the plane in cm->cur_frame->buf is overwritten with the copy held
// in cpi->last_frame_uf, so the caller must have saved the unfiltered plane
// there beforehand.
static int64_t try_filter_frame(const YV12_BUFFER_CONFIG *sd,
                                AV1_COMP *const cpi, int filt_level,
                                int partial_frame, int plane, int dir) {
  assert(plane >= 0 && plane <= 2);

  AV1_COMMON *const cm = &cpi->common;
  MultiThreadInfo *const mt_info = &cpi->mt_info;
  const int lpf_workers = mt_info->num_mod_workers[MOD_LPF];

  // Install the candidate as the frame-level base strength so that
  // av1_get_filter_level() sees it when running in DELTA_LF mode. For luma the
  // entry that is not being searched keeps its current value.
  if (plane == 0) {
    if (dir != 1) cm->lf.filter_level[0] = filt_level;
    if (dir != 0) cm->lf.filter_level[1] = filt_level;
  } else if (plane == 1) {
    cm->lf.filter_level_u = filt_level;
  } else if (plane == 2) {
    cm->lf.filter_level_v = filt_level;
  }

  // A value of 1 enables dual/quad loop-filtering.
  const int lpf_opt_level = is_inter_tx_size_search_level_one(&cpi->sf.tx_sf);

  // Filter only the requested plane: [plane, plane + 1).
  av1_loop_filter_frame_mt(&cm->cur_frame->buf, cm, &cpi->td.mb.e_mbd, plane,
                           plane + 1, partial_frame, mt_info->workers,
                           lpf_workers, &mt_info->lf_row_sync, lpf_opt_level);

  const int64_t plane_sse = aom_get_sse_plane(
      sd, &cm->cur_frame->buf, plane, cm->seq_params->use_highbitdepth);

  // Put the unfiltered plane back so the next trial starts from clean data.
  yv12_copy_plane(&cpi->last_frame_uf, &cm->cur_frame->buf, plane);

  return plane_sse;
}
87
// Searches for the loop filter level of one plane by repeatedly trying levels
// one step below and/or above the current centre and shrinking the step once
// the centre stops moving.
//
//   sd                      - source frame used to measure the filtering
//                             error.
//   cpi                     - encoder instance.
//   partial_frame           - forwarded to try_filter_frame().
//   last_frame_filter_level - four starting levels: [0] and [1] are used for
//                             plane 0, [2] for plane 1, [3] for plane 2.
//   plane                   - plane index, 0..2.
//   dir                     - for plane 0: 0 or 1 starts from
//                             last_frame_filter_level[dir], 2 starts from the
//                             rounded average of entries [0] and [1].
//
// Returns the selected level. An out-of-range plane (or dir, for plane 0)
// asserts in debug builds and returns 0 otherwise.
static int search_filter_level(const YV12_BUFFER_CONFIG *sd, AV1_COMP *cpi,
                               int partial_frame,
                               const int *last_frame_filter_level, int plane,
                               int dir) {
  const AV1_COMMON *const cm = &cpi->common;
  const int level_floor = 0;
  const int level_ceil = av1_get_max_filter_level(cpi);

  // Start from the previous frame's level; it is clamped below in case it is
  // now out of range.
  int seed_level;
  if (plane == 0) {
    if (dir == 2) {
      seed_level =
          (last_frame_filter_level[0] + last_frame_filter_level[1] + 1) >> 1;
    } else if (dir == 0 || dir == 1) {
      seed_level = last_frame_filter_level[dir];
    } else {
      assert(dir >= 0 && dir <= 2);
      return 0;
    }
  } else if (plane == 1) {
    seed_level = last_frame_filter_level[2];
  } else if (plane == 2) {
    seed_level = last_frame_filter_level[3];
  } else {
    assert(plane >= 0 && plane <= 2);
    return 0;
  }

  int center = clamp(seed_level, level_floor, level_ceil);
  int step = (center < 16) ? 4 : center / 4;

  // The search ends as soon as the step is no longer above stop_step; the
  // coarse search stops earlier than the full one.
  const int use_coarse_search = cpi->sf.lpf_sf.use_coarse_filter_level_search;
  assert(use_coarse_search <= 1);
  static const int min_filter_step_lookup[2] = { 0, 2 };
  const int stop_step = min_filter_step_lookup[use_coarse_search];

  // Error measured at each level so far; -1 marks "not evaluated yet".
  int64_t level_sse[MAX_LOOP_FILTER + 1];
  for (int i = 0; i <= MAX_LOOP_FILTER; ++i) level_sse[i] = -1;

  // Keep a copy of the unfiltered plane; try_filter_frame() restores from it
  // after every trial.
  yv12_copy_plane(&cm->cur_frame->buf, &cpi->last_frame_uf, plane);

  int64_t best_sse =
      try_filter_frame(sd, cpi, center, partial_frame, plane, dir);
  int best_level = center;
  level_sse[center] = best_sse;

  // -1: keep probing downwards, 1: keep probing upwards, 0: probe both sides.
  int direction = 0;

  while (step > stop_step) {
    const int above = AOMMIN(center + step, level_ceil);
    const int below = AOMMAX(center - step, level_floor);

    // Bias against raising the loop filter in favor of lowering it.
    int64_t bias = (best_sse >> (15 - (center / 8))) * step;

    if (is_stat_consumption_stage_twopass(cpi) &&
        cpi->ppi->twopass.section_intra_rating < 20) {
      bias = (bias * cpi->ppi->twopass.section_intra_rating) / 20;
    }

    // Use a smaller bias when transforms larger than 4x4 are allowed.
    if (cm->features.tx_mode != ONLY_4X4) bias >>= 1;

    if (direction <= 0 && below != center) {
      // Measure the lower level unless it has been tried already.
      if (level_sse[below] < 0) {
        level_sse[below] =
            try_filter_frame(sd, cpi, below, partial_frame, plane, dir);
      }
      const int64_t below_sse = level_sse[below];
      // A lower level wins even when it is slightly worse than the best so
      // far (within the bias); the best error only moves if it truly improved.
      if (below_sse < best_sse + bias) {
        if (below_sse < best_sse) best_sse = below_sse;
        best_level = below;
      }
    }

    if (direction >= 0 && above != center) {
      // Measure the higher level unless it has been tried already.
      if (level_sse[above] < 0) {
        level_sse[above] =
            try_filter_frame(sd, cpi, above, partial_frame, plane, dir);
      }
      const int64_t above_sse = level_sse[above];
      // A higher level must beat the best so far by more than the bias.
      if (above_sse < best_sse - bias) {
        best_sse = above_sse;
        best_level = above;
      }
    }

    if (best_level != center) {
      // The centre moved: keep going the same way with the same step.
      direction = (best_level < center) ? -1 : 1;
      center = best_level;
    } else {
      // The centre held: halve the step and look on both sides again.
      step /= 2;
      direction = 0;
    }
  }

  return best_level;
}
194
// Chooses the frame-level loop filter strengths and stores them in cm->lf.
//
//   sd     - source frame; only used when the levels are found by search.
//   cpi    - encoder instance.
//   method - selection strategy:
//              LPF_PICK_MINIMAL_LPF     : both luma levels are set to 0.
//              >= LPF_PICK_FROM_Q       : all four levels are derived from the
//                                         quantizer with a fixed-point linear
//                                         model, then optionally zeroed for
//                                         luma under LOOPFILTER_SELECTIVELY.
//              anything else            : levels are found with
//                                         search_filter_level().
//
// lf->sharpness_level is always reset to 0. When filtering is disabled (by
// configuration, for non-reference frames under LOOPFILTER_REFERENCE, or by
// the real-time screen-content check) both luma levels are set to 0 and the
// function returns immediately.
void av1_pick_filter_level(const YV12_BUFFER_CONFIG *sd, AV1_COMP *cpi,
                           LPF_PICK_METHOD method) {
  AV1_COMMON *const cm = &cpi->common;
  const SequenceHeader *const seq_params = cm->seq_params;
  const int num_planes = av1_num_planes(cm);
  struct loopfilter *const lf = &cm->lf;
  int disable_filter_rt_screen = 0;

  lf->sharpness_level = 0;

  if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_SCREEN &&
      cpi->oxcf.q_cfg.aq_mode == CYCLIC_REFRESH_AQ &&
      cpi->sf.rt_sf.skip_lf_screen)
    disable_filter_rt_screen = av1_cyclic_refresh_disable_lf_cdef(cpi);

  if (disable_filter_rt_screen ||
      cpi->oxcf.algo_cfg.loopfilter_control == LOOPFILTER_NONE ||
      (cpi->oxcf.algo_cfg.loopfilter_control == LOOPFILTER_REFERENCE &&
       cpi->ppi->rtc_ref.non_reference_frame)) {
    lf->filter_level[0] = 0;
    lf->filter_level[1] = 0;
    return;
  }

  if (method == LPF_PICK_MINIMAL_LPF) {
    lf->filter_level[0] = 0;
    lf->filter_level[1] = 0;
  } else if (method >= LPF_PICK_FROM_Q) {
    const int min_filter_level = 0;
    const int max_filter_level = av1_get_max_filter_level(cpi);
    const int q = av1_ac_quant_QTX(cm->quant_params.base_qindex, 0,
                                   seq_params->bit_depth);
    // Based on test results for the rtc test set:
    // 0.04590 boosted or 0.02295 non-boosted, in 18-bit fixed point
    // (12034 / 2^18 and 6017 / 2^18 respectively).
    const int strength_boost_q_threshold = 0;
    // The frame area is computed in 64 bits so that very large frames cannot
    // overflow the int product.
    const int inter_frame_multiplier =
        (q > strength_boost_q_threshold ||
         (cpi->sf.rt_sf.use_nonrd_pick_mode &&
          (int64_t)cm->width * cm->height > 352 * 288))
            ? 12034
            : 6017;
    // These values were determined by linear fitting the result of the
    // searched level for 8 bit depth:
    // Keyframes: filt_guess = q * 0.06699 - 1.60817
    // Other frames: filt_guess = q * inter_frame_multiplier + 2.48225
    //
    // And high bit depth separately:
    // filt_guess = q * 0.316206 + 3.87252
    int filt_guess;
    switch (seq_params->bit_depth) {
      case AOM_BITS_8:
        filt_guess =
            (cm->current_frame.frame_type == KEY_FRAME)
                ? ROUND_POWER_OF_TWO(q * 17563 - 421574, 18)
                : ROUND_POWER_OF_TWO(q * inter_frame_multiplier + 650707, 18);
        break;
      case AOM_BITS_10:
        filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 4060632, 20);
        break;
      case AOM_BITS_12:
        filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 16242526, 22);
        break;
      default:
        assert(0 &&
               "bit_depth should be AOM_BITS_8, AOM_BITS_10 "
               "or AOM_BITS_12");
        return;
    }
    if (seq_params->bit_depth != AOM_BITS_8 &&
        cm->current_frame.frame_type == KEY_FRAME)
      filt_guess -= 4;
    // TODO(chengchen): retrain the model for Y, U, V filter levels
    lf->filter_level[0] = clamp(filt_guess, min_filter_level, max_filter_level);
    lf->filter_level[1] = clamp(filt_guess, min_filter_level, max_filter_level);
    lf->filter_level_u = clamp(filt_guess, min_filter_level, max_filter_level);
    lf->filter_level_v = clamp(filt_guess, min_filter_level, max_filter_level);
    if (cpi->oxcf.algo_cfg.loopfilter_control == LOOPFILTER_SELECTIVELY &&
        !frame_is_intra_only(cm) && !cpi->rc.high_source_sad) {
      if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_SCREEN) {
        lf->filter_level[0] = 0;
        lf->filter_level[1] = 0;
      } else {
        // Number of whole 4x4 units in the frame. This is 0 when either
        // dimension is below 4, so it must be checked before it is used as a
        // divisor; in that case the Q-derived levels are kept.
        const int num4x4 = (cm->width >> 2) * (cm->height >> 2);
        const int newmv_thresh = 7;
        const int distance_since_key_thresh = 5;
        // Skip luma filtering when fewer than newmv_thresh percent of the
        // 4x4 units were counted as new-mv or intra and the frame is far
        // enough from the last key frame.
        if (num4x4 > 0 &&
            (cpi->td.rd_counts.newmv_or_intra_blocks * 100 / num4x4) <
                newmv_thresh &&
            cpi->rc.frames_since_key > distance_since_key_thresh) {
          lf->filter_level[0] = 0;
          lf->filter_level[1] = 0;
        }
      }
    }
  } else {
    // Starting points for the search: zeros for intra-only frames, otherwise
    // the levels stored in cpi->ppi.
    int last_frame_filter_level[4] = { 0 };
    if (!frame_is_intra_only(cm)) {
      last_frame_filter_level[0] = cpi->ppi->filter_level[0];
      last_frame_filter_level[1] = cpi->ppi->filter_level[1];
      last_frame_filter_level[2] = cpi->ppi->filter_level_u;
      last_frame_filter_level[3] = cpi->ppi->filter_level_v;
    }
    // The frame buffer last_frame_uf is used to store the non-loop filtered
    // reconstructed frame in search_filter_level().
    if (aom_realloc_frame_buffer(
            &cpi->last_frame_uf, cm->width, cm->height,
            seq_params->subsampling_x, seq_params->subsampling_y,
            seq_params->use_highbitdepth, cpi->oxcf.border_in_pixels,
            cm->features.byte_alignment, NULL, NULL, NULL, 0, 0))
      aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
                         "Failed to allocate last frame buffer");

    // First find one level shared by both luma entries (dir == 2).
    lf->filter_level[0] = lf->filter_level[1] =
        search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                            last_frame_filter_level, 0, 2);
    // Then, unless the non-dual method was requested, refine each luma entry
    // on its own.
    if (method != LPF_PICK_FROM_FULL_IMAGE_NON_DUAL) {
      lf->filter_level[0] =
          search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                              last_frame_filter_level, 0, 0);
      lf->filter_level[1] =
          search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                              last_frame_filter_level, 0, 1);
    }

    // Chroma levels are only searched when chroma planes exist.
    if (num_planes > 1) {
      lf->filter_level_u =
          search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                              last_frame_filter_level, 1, 0);
      lf->filter_level_v =
          search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                              last_frame_filter_level, 2, 0);
    }
  }
}
329