1 /*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12 #ifndef AOM_AV1_ENCODER_ENCODEMB_H_
13 #define AOM_AV1_ENCODER_ENCODEMB_H_
14
15 #include "config/aom_config.h"
16
17 #include "av1/common/av1_common_int.h"
18 #include "av1/common/txb_common.h"
19 #include "av1/encoder/av1_quantize.h"
20 #include "av1/encoder/block.h"
21 #include "av1/encoder/tokenize.h"
22 #ifdef __cplusplus
23 extern "C" {
24 #endif
25
26 enum {
27 AV1_XFORM_QUANT_FP = 0,
28 AV1_XFORM_QUANT_B = 1,
29 AV1_XFORM_QUANT_DC = 2,
30 AV1_XFORM_QUANT_SKIP_QUANT,
31 AV1_XFORM_QUANT_TYPES,
32 } UENUM1BYTE(AV1_XFORM_QUANT);
33
34 // TODO(any): Merge OPT_TYPe and TRELLLIS_OPT_TYPE
35 // Available optimization types to optimize the quantized coefficients.
36 enum {
37 NONE_OPT = 0, // No optimization.
38 TRELLIS_OPT = 1, // Trellis optimization. See `av1_optimize_b()`.
39 DROPOUT_OPT = 2, // Dropout optimization. See `av1_dropout_qcoeff()`.
40 TRELLIS_DROPOUT_OPT = 3 // Perform dropout after trellis optimization.
41 } UENUM1BYTE(OPT_TYPE);
42
43 enum {
44 NO_TRELLIS_OPT, // No trellis optimization
45 FULL_TRELLIS_OPT, // Trellis optimization in all stages
46 FINAL_PASS_TRELLIS_OPT, // Trellis optimization in only the final encode pass
47 NO_ESTIMATE_YRD_TRELLIS_OPT // Disable trellis in estimate_yrd_for_sb
48 } UENUM1BYTE(TRELLIS_OPT_TYPE);
49
50 struct optimize_ctx {
51 ENTROPY_CONTEXT ta[MAX_MB_PLANE][MAX_MIB_SIZE];
52 ENTROPY_CONTEXT tl[MAX_MB_PLANE][MAX_MIB_SIZE];
53 };
54
55 struct encode_b_args {
56 const struct AV1_COMP *cpi;
57 MACROBLOCK *x;
58 struct optimize_ctx *ctx;
59 int8_t *skip;
60 ENTROPY_CONTEXT *ta;
61 ENTROPY_CONTEXT *tl;
62 RUN_TYPE dry_run;
63 TRELLIS_OPT_TYPE enable_optimize_b;
64 };
65
66 void av1_encode_sb(const struct AV1_COMP *cpi, MACROBLOCK *x, BLOCK_SIZE bsize,
67 RUN_TYPE dry_run);
68
69 void av1_foreach_transformed_block_in_plane(
70 const MACROBLOCKD *const xd, BLOCK_SIZE plane_bsize, int plane,
71 foreach_transformed_block_visitor visit, void *arg);
72
73 void av1_encode_sby_pass1(struct AV1_COMP *cpi, MACROBLOCK *x,
74 BLOCK_SIZE bsize);
75
76 void av1_setup_xform(const AV1_COMMON *cm, MACROBLOCK *x, TX_SIZE tx_size,
77 TX_TYPE tx_type, TxfmParam *txfm_param);
78 void av1_setup_quant(TX_SIZE tx_size, int use_optimize_b, int xform_quant_idx,
79 int use_quant_b_adapt, QUANT_PARAM *qparam);
80 void av1_setup_qmatrix(const CommonQuantParams *quant_params,
81 const MACROBLOCKD *xd, int plane, TX_SIZE tx_size,
82 TX_TYPE tx_type, QUANT_PARAM *qparam);
83
84 void av1_xform_dc_only(MACROBLOCK *x, int plane, int block,
85 TxfmParam *txfm_param, int64_t per_px_mean);
86
87 void av1_xform_quant(MACROBLOCK *x, int plane, int block, int blk_row,
88 int blk_col, BLOCK_SIZE plane_bsize, TxfmParam *txfm_param,
89 QUANT_PARAM *qparam);
90
91 void av1_xform(MACROBLOCK *x, int plane, int block, int blk_row, int blk_col,
92 BLOCK_SIZE plane_bsize, TxfmParam *txfm_param);
93
94 void av1_quant(MACROBLOCK *x, int plane, int block, TxfmParam *txfm_param,
95 QUANT_PARAM *qparam);
96
97 int av1_optimize_b(const struct AV1_COMP *cpi, MACROBLOCK *mb, int plane,
98 int block, TX_SIZE tx_size, TX_TYPE tx_type,
99 const TXB_CTX *const txb_ctx, int *rate_cost);
100
101 // This function can be used as (i) a further optimization to reduce the
102 // redundancy of quantized coefficients (a.k.a., `qcoeff`) after trellis
103 // optimization, or (ii) an alternative to trellis optimization in high-speed
104 // compression mode (e.g., real-time mode under speed-6) due to its LOW time
105 // complexity. The rational behind is to drop out the may-be redundant quantized
106 // coefficient which is among a bunch of zeros. NOTE: This algorithm is not as
107 // accurate as trellis optimization since the hyper-parameters are hard-coded
108 // instead of dynamic search. More adaptive logic may improve the performance.
109 // This function should be applied to all or partical block cells.
110 // Inputs:
111 // mb: Pointer to the MACROBLOCK to perform dropout on.
112 // plane: Index of the plane to which the target block belongs.
113 // block: Index of the target block.
114 // tx_size: Transform size of the target block.
115 // tx_type: Transform type of the target block. This field is particularly
116 // used to find out the scan order of the block.
117 // qindex: Quantization index used for target block. In general, all blocks
118 // in a same plane share the same quantization index. This field is
119 // particularly used to determine how many zeros should be used to
120 // drop out a coefficient.
121 // Returns:
122 // Nothing will be returned, but `qcoeff`, `dqcoeff`, `eob`, as well as
123 // `txb_entropy_ctx`, which `mb` points to, may be modified by this function.
124 void av1_dropout_qcoeff(MACROBLOCK *mb, int plane, int block, TX_SIZE tx_size,
125 TX_TYPE tx_type, int qindex);
126 // Same as above, with the number of zeroes needed before/after a coeff to drop
127 // it explicitly passed in, instead of being derived from qindex.
128 void av1_dropout_qcoeff_num(MACROBLOCK *mb, int plane, int block,
129 TX_SIZE tx_size, TX_TYPE tx_type,
130 int dropout_num_before, int dropout_num_after);
131
132 void av1_subtract_block(BitDepthInfo bd_info, int rows, int cols, int16_t *diff,
133 ptrdiff_t diff_stride, const uint8_t *src8,
134 ptrdiff_t src_stride, const uint8_t *pred8,
135 ptrdiff_t pred_stride);
136
137 void av1_subtract_txb(MACROBLOCK *x, int plane, BLOCK_SIZE plane_bsize,
138 int blk_col, int blk_row, TX_SIZE tx_size);
139
140 void av1_subtract_plane(MACROBLOCK *x, BLOCK_SIZE plane_bsize, int plane);
141
av1_set_txb_context(MACROBLOCK * x,int plane,int block,TX_SIZE tx_size,ENTROPY_CONTEXT * a,ENTROPY_CONTEXT * l)142 static INLINE void av1_set_txb_context(MACROBLOCK *x, int plane, int block,
143 TX_SIZE tx_size, ENTROPY_CONTEXT *a,
144 ENTROPY_CONTEXT *l) {
145 const uint8_t ctx = x->plane[plane].txb_entropy_ctx[block];
146 memset(a, ctx, tx_size_wide_unit[tx_size] * sizeof(*a));
147 memset(l, ctx, tx_size_high_unit[tx_size] * sizeof(*l));
148 }
149
150 void av1_encode_block_intra(int plane, int block, int blk_row, int blk_col,
151 BLOCK_SIZE plane_bsize, TX_SIZE tx_size, void *arg);
152
153 void av1_encode_intra_block_plane(const struct AV1_COMP *cpi, MACROBLOCK *x,
154 BLOCK_SIZE bsize, int plane, RUN_TYPE dry_run,
155 TRELLIS_OPT_TYPE enable_optimize_b);
156
is_trellis_used(TRELLIS_OPT_TYPE optimize_b,RUN_TYPE dry_run)157 static INLINE int is_trellis_used(TRELLIS_OPT_TYPE optimize_b,
158 RUN_TYPE dry_run) {
159 if (optimize_b == NO_TRELLIS_OPT) return false;
160 if (optimize_b == FINAL_PASS_TRELLIS_OPT && dry_run != OUTPUT_ENABLED)
161 return false;
162 return true;
163 }
164
165 // Scaling terms (precision of 12 bits) to perform tx-size specific
166 // normalization that is used in DCT_DCT forward transform.
167 // For transform blocks of 1:2 and 2:1 - sqrt(2) normalization is used
168 // For transform blocks of 1:4 and 4:1 - factor of 2 is used
169 // For transform blocks TX_8x8 and below - an additional factor of 2 is used
170 // For transform blocks max(width,height)=64 - currently not supported
171
172 static const uint16_t dc_coeff_scale[TX_SIZES_ALL] = {
173 1024, 2048, 4096, 4096, 0, 1448, 1448, 2896, 2896, 2896,
174 2896, 0, 0, 2048, 2048, 4096, 4096, 0, 0
175 };
176
177 #ifdef __cplusplus
178 } // extern "C"
179 #endif
180
181 #endif // AOM_AV1_ENCODER_ENCODEMB_H_
182