• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (c) 2020, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 #include "aom/aomcx.h"
13 
14 #include "av1/encoder/bitstream.h"
15 #include "av1/encoder/encodeframe.h"
16 #include "av1/encoder/encoder.h"
17 #include "av1/encoder/encoder_alloc.h"
18 #include "av1/encoder/encodetxb.h"
19 #include "av1/encoder/encoder_utils.h"
20 #include "av1/encoder/grain_test_vectors.h"
21 #include "av1/encoder/mv_prec.h"
22 #include "av1/encoder/rc_utils.h"
23 #include "av1/encoder/rdopt.h"
24 #include "av1/encoder/segmentation.h"
25 #include "av1/encoder/superres_scale.h"
26 #include "av1/encoder/tpl_model.h"
27 #include "av1/encoder/var_based_part.h"
28 
29 #if CONFIG_TUNE_VMAF
30 #include "av1/encoder/tune_vmaf.h"
31 #endif
32 
33 #define MIN_BOOST_COMBINE_FACTOR 4.0
34 #define MAX_BOOST_COMBINE_FACTOR 12.0
35 
36 const int default_tx_type_probs[FRAME_UPDATE_TYPES][TX_SIZES_ALL][TX_TYPES] = {
37   { { 221, 189, 214, 292, 0, 0, 0, 0, 0, 2, 38, 68, 0, 0, 0, 0 },
38     { 262, 203, 216, 239, 0, 0, 0, 0, 0, 1, 37, 66, 0, 0, 0, 0 },
39     { 315, 231, 239, 226, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
40     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
41     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
42     { 222, 188, 214, 287, 0, 0, 0, 0, 0, 2, 50, 61, 0, 0, 0, 0 },
43     { 256, 182, 205, 282, 0, 0, 0, 0, 0, 2, 21, 76, 0, 0, 0, 0 },
44     { 281, 214, 217, 222, 0, 0, 0, 0, 0, 1, 48, 41, 0, 0, 0, 0 },
45     { 263, 194, 225, 225, 0, 0, 0, 0, 0, 2, 15, 100, 0, 0, 0, 0 },
46     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
47     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
48     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
49     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
50     { 170, 192, 242, 293, 0, 0, 0, 0, 0, 1, 68, 58, 0, 0, 0, 0 },
51     { 199, 210, 213, 291, 0, 0, 0, 0, 0, 1, 14, 96, 0, 0, 0, 0 },
52     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
53     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
54     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
55     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
56   { { 106, 69, 107, 278, 9, 15, 20, 45, 49, 23, 23, 88, 36, 74, 25, 57 },
57     { 105, 72, 81, 98, 45, 49, 47, 50, 56, 72, 30, 81, 33, 95, 27, 83 },
58     { 211, 105, 109, 120, 57, 62, 43, 49, 52, 58, 42, 116, 0, 0, 0, 0 },
59     { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
60     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
61     { 131, 57, 98, 172, 19, 40, 37, 64, 69, 22, 41, 52, 51, 77, 35, 59 },
62     { 176, 83, 93, 202, 22, 24, 28, 47, 50, 16, 12, 93, 26, 76, 17, 59 },
63     { 136, 72, 89, 95, 46, 59, 47, 56, 61, 68, 35, 51, 32, 82, 26, 69 },
64     { 122, 80, 87, 105, 49, 47, 46, 46, 57, 52, 13, 90, 19, 103, 15, 93 },
65     { 1009, 0, 0, 0, 0, 0, 0, 0, 0, 15, 0, 0, 0, 0, 0, 0 },
66     { 1011, 0, 0, 0, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
67     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
68     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
69     { 202, 20, 84, 114, 14, 60, 41, 79, 99, 21, 41, 15, 50, 84, 34, 66 },
70     { 196, 44, 23, 72, 30, 22, 28, 57, 67, 13, 4, 165, 15, 148, 9, 131 },
71     { 882, 0, 0, 0, 0, 0, 0, 0, 0, 142, 0, 0, 0, 0, 0, 0 },
72     { 840, 0, 0, 0, 0, 0, 0, 0, 0, 184, 0, 0, 0, 0, 0, 0 },
73     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
74     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
75   { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
76     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
77     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
78     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
79     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
80     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
81     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
82     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
83     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
84     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
85     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
86     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
87     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
88     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
89     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
90     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
91     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
92     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
93     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
94   { { 213, 110, 141, 269, 12, 16, 15, 19, 21, 11, 38, 68, 22, 29, 16, 24 },
95     { 216, 119, 128, 143, 38, 41, 26, 30, 31, 30, 42, 70, 23, 36, 19, 32 },
96     { 367, 149, 154, 154, 38, 35, 17, 21, 21, 10, 22, 36, 0, 0, 0, 0 },
97     { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
98     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
99     { 219, 96, 127, 191, 21, 40, 25, 32, 34, 18, 45, 45, 33, 39, 26, 33 },
100     { 296, 99, 122, 198, 23, 21, 19, 24, 25, 13, 20, 64, 23, 32, 18, 27 },
101     { 275, 128, 142, 143, 35, 48, 23, 30, 29, 18, 42, 36, 18, 23, 14, 20 },
102     { 239, 132, 166, 175, 36, 27, 19, 21, 24, 14, 13, 85, 9, 31, 8, 25 },
103     { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
104     { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
105     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
106     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
107     { 309, 25, 79, 59, 25, 80, 34, 53, 61, 25, 49, 23, 43, 64, 36, 59 },
108     { 270, 57, 40, 54, 50, 42, 41, 53, 56, 28, 17, 81, 45, 86, 34, 70 },
109     { 1005, 0, 0, 0, 0, 0, 0, 0, 0, 19, 0, 0, 0, 0, 0, 0 },
110     { 992, 0, 0, 0, 0, 0, 0, 0, 0, 32, 0, 0, 0, 0, 0, 0 },
111     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
112     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
113   { { 133, 63, 55, 83, 57, 87, 58, 72, 68, 16, 24, 35, 29, 105, 25, 114 },
114     { 131, 75, 74, 60, 71, 77, 65, 66, 73, 33, 21, 79, 20, 83, 18, 78 },
115     { 276, 95, 82, 58, 86, 93, 63, 60, 64, 17, 38, 92, 0, 0, 0, 0 },
116     { 1006, 0, 0, 0, 0, 0, 0, 0, 0, 18, 0, 0, 0, 0, 0, 0 },
117     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
118     { 147, 49, 75, 78, 50, 97, 60, 67, 76, 17, 42, 35, 31, 93, 27, 80 },
119     { 157, 49, 58, 75, 61, 52, 56, 67, 69, 12, 15, 79, 24, 119, 11, 120 },
120     { 178, 69, 83, 77, 69, 85, 72, 77, 77, 20, 35, 40, 25, 48, 23, 46 },
121     { 174, 55, 64, 57, 73, 68, 62, 61, 75, 15, 12, 90, 17, 99, 16, 86 },
122     { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
123     { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
124     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
125     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
126     { 266, 31, 63, 64, 21, 52, 39, 54, 63, 30, 52, 31, 48, 89, 46, 75 },
127     { 272, 26, 32, 44, 29, 31, 32, 53, 51, 13, 13, 88, 22, 153, 16, 149 },
128     { 923, 0, 0, 0, 0, 0, 0, 0, 0, 101, 0, 0, 0, 0, 0, 0 },
129     { 969, 0, 0, 0, 0, 0, 0, 0, 0, 55, 0, 0, 0, 0, 0, 0 },
130     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
131     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
132   { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
133     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
134     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
135     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
136     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
137     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
138     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
139     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
140     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
141     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
142     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
143     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
144     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
145     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
146     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
147     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
148     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
149     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
150     { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
151   { { 158, 92, 125, 298, 12, 15, 20, 29, 31, 12, 29, 67, 34, 44, 23, 35 },
152     { 147, 94, 103, 123, 45, 48, 38, 41, 46, 48, 37, 78, 33, 63, 27, 53 },
153     { 268, 126, 125, 136, 54, 53, 31, 38, 38, 33, 35, 87, 0, 0, 0, 0 },
154     { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
155     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
156     { 159, 72, 103, 194, 20, 35, 37, 50, 56, 21, 39, 40, 51, 61, 38, 48 },
157     { 259, 86, 95, 188, 32, 20, 25, 34, 37, 13, 12, 85, 25, 53, 17, 43 },
158     { 189, 99, 113, 123, 45, 59, 37, 46, 48, 44, 39, 41, 31, 47, 26, 37 },
159     { 175, 110, 113, 128, 58, 38, 33, 33, 43, 29, 13, 100, 14, 68, 12, 57 },
160     { 1017, 0, 0, 0, 0, 0, 0, 0, 0, 7, 0, 0, 0, 0, 0, 0 },
161     { 1019, 0, 0, 0, 0, 0, 0, 0, 0, 5, 0, 0, 0, 0, 0, 0 },
162     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
163     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
164     { 208, 22, 84, 101, 21, 59, 44, 70, 90, 25, 59, 13, 64, 67, 49, 48 },
165     { 277, 52, 32, 63, 43, 26, 33, 48, 54, 11, 6, 130, 18, 119, 11, 101 },
166     { 963, 0, 0, 0, 0, 0, 0, 0, 0, 61, 0, 0, 0, 0, 0, 0 },
167     { 979, 0, 0, 0, 0, 0, 0, 0, 0, 45, 0, 0, 0, 0, 0, 0 },
168     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
169     { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } }
170 };
171 
172 const int default_obmc_probs[FRAME_UPDATE_TYPES][BLOCK_SIZES_ALL] = {
173   { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
174   { 0,  0,  0,  106, 90, 90, 97, 67, 59, 70, 28,
175     30, 38, 16, 16,  16, 0,  0,  44, 50, 26, 25 },
176   { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
177   { 0,  0,  0,  98, 93, 97, 68, 82, 85, 33, 30,
178     33, 16, 16, 16, 16, 0,  0,  43, 37, 26, 16 },
179   { 0,  0,  0,  91, 80, 76, 78, 55, 49, 24, 16,
180     16, 16, 16, 16, 16, 0,  0,  29, 45, 16, 38 },
181   { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
182   { 0,  0,  0,  103, 89, 89, 89, 62, 63, 76, 34,
183     35, 32, 19, 16,  16, 0,  0,  49, 55, 29, 19 }
184 };
185 
186 const int default_warped_probs[FRAME_UPDATE_TYPES] = { 64, 64, 64, 64,
187                                                        64, 64, 64 };
188 
189 // TODO(yunqing): the default probs can be trained later from better
190 // performance.
191 const int default_switchable_interp_probs[FRAME_UPDATE_TYPES]
192                                          [SWITCHABLE_FILTER_CONTEXTS]
193                                          [SWITCHABLE_FILTERS] = {
194                                            { { 512, 512, 512 },
195                                              { 512, 512, 512 },
196                                              { 512, 512, 512 },
197                                              { 512, 512, 512 },
198                                              { 512, 512, 512 },
199                                              { 512, 512, 512 },
200                                              { 512, 512, 512 },
201                                              { 512, 512, 512 },
202                                              { 512, 512, 512 },
203                                              { 512, 512, 512 },
204                                              { 512, 512, 512 },
205                                              { 512, 512, 512 },
206                                              { 512, 512, 512 },
207                                              { 512, 512, 512 },
208                                              { 512, 512, 512 },
209                                              { 512, 512, 512 } },
210                                            { { 512, 512, 512 },
211                                              { 512, 512, 512 },
212                                              { 512, 512, 512 },
213                                              { 512, 512, 512 },
214                                              { 512, 512, 512 },
215                                              { 512, 512, 512 },
216                                              { 512, 512, 512 },
217                                              { 512, 512, 512 },
218                                              { 512, 512, 512 },
219                                              { 512, 512, 512 },
220                                              { 512, 512, 512 },
221                                              { 512, 512, 512 },
222                                              { 512, 512, 512 },
223                                              { 512, 512, 512 },
224                                              { 512, 512, 512 },
225                                              { 512, 512, 512 } },
226                                            { { 512, 512, 512 },
227                                              { 512, 512, 512 },
228                                              { 512, 512, 512 },
229                                              { 512, 512, 512 },
230                                              { 512, 512, 512 },
231                                              { 512, 512, 512 },
232                                              { 512, 512, 512 },
233                                              { 512, 512, 512 },
234                                              { 512, 512, 512 },
235                                              { 512, 512, 512 },
236                                              { 512, 512, 512 },
237                                              { 512, 512, 512 },
238                                              { 512, 512, 512 },
239                                              { 512, 512, 512 },
240                                              { 512, 512, 512 },
241                                              { 512, 512, 512 } },
242                                            { { 512, 512, 512 },
243                                              { 512, 512, 512 },
244                                              { 512, 512, 512 },
245                                              { 512, 512, 512 },
246                                              { 512, 512, 512 },
247                                              { 512, 512, 512 },
248                                              { 512, 512, 512 },
249                                              { 512, 512, 512 },
250                                              { 512, 512, 512 },
251                                              { 512, 512, 512 },
252                                              { 512, 512, 512 },
253                                              { 512, 512, 512 },
254                                              { 512, 512, 512 },
255                                              { 512, 512, 512 },
256                                              { 512, 512, 512 },
257                                              { 512, 512, 512 } },
258                                            { { 512, 512, 512 },
259                                              { 512, 512, 512 },
260                                              { 512, 512, 512 },
261                                              { 512, 512, 512 },
262                                              { 512, 512, 512 },
263                                              { 512, 512, 512 },
264                                              { 512, 512, 512 },
265                                              { 512, 512, 512 },
266                                              { 512, 512, 512 },
267                                              { 512, 512, 512 },
268                                              { 512, 512, 512 },
269                                              { 512, 512, 512 },
270                                              { 512, 512, 512 },
271                                              { 512, 512, 512 },
272                                              { 512, 512, 512 },
273                                              { 512, 512, 512 } },
274                                            { { 512, 512, 512 },
275                                              { 512, 512, 512 },
276                                              { 512, 512, 512 },
277                                              { 512, 512, 512 },
278                                              { 512, 512, 512 },
279                                              { 512, 512, 512 },
280                                              { 512, 512, 512 },
281                                              { 512, 512, 512 },
282                                              { 512, 512, 512 },
283                                              { 512, 512, 512 },
284                                              { 512, 512, 512 },
285                                              { 512, 512, 512 },
286                                              { 512, 512, 512 },
287                                              { 512, 512, 512 },
288                                              { 512, 512, 512 },
289                                              { 512, 512, 512 } },
290                                            { { 512, 512, 512 },
291                                              { 512, 512, 512 },
292                                              { 512, 512, 512 },
293                                              { 512, 512, 512 },
294                                              { 512, 512, 512 },
295                                              { 512, 512, 512 },
296                                              { 512, 512, 512 },
297                                              { 512, 512, 512 },
298                                              { 512, 512, 512 },
299                                              { 512, 512, 512 },
300                                              { 512, 512, 512 },
301                                              { 512, 512, 512 },
302                                              { 512, 512, 512 },
303                                              { 512, 512, 512 },
304                                              { 512, 512, 512 },
305                                              { 512, 512, 512 } }
306                                          };
307 
configure_static_seg_features(AV1_COMP * cpi)308 static void configure_static_seg_features(AV1_COMP *cpi) {
309   AV1_COMMON *const cm = &cpi->common;
310   const RATE_CONTROL *const rc = &cpi->rc;
311   struct segmentation *const seg = &cm->seg;
312 
313   double avg_q = cpi->ppi->p_rc.avg_q;
314   int high_q = (int)(avg_q > 48.0);
315   int qi_delta;
316 
317   // Disable and clear down for KF
318   if (cm->current_frame.frame_type == KEY_FRAME) {
319     // Clear down the global segmentation map
320     memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
321     seg->update_map = 0;
322     seg->update_data = 0;
323 
324     // Disable segmentation
325     av1_disable_segmentation(seg);
326 
327     // Clear down the segment features.
328     av1_clearall_segfeatures(seg);
329   } else if (cpi->refresh_frame.alt_ref_frame) {
330     // If this is an alt ref frame
331     // Clear down the global segmentation map
332     memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
333     seg->update_map = 0;
334     seg->update_data = 0;
335 
336     // Disable segmentation and individual segment features by default
337     av1_disable_segmentation(seg);
338     av1_clearall_segfeatures(seg);
339 
340     // If segmentation was enabled set those features needed for the
341     // arf itself.
342     if (seg->enabled) {
343       seg->update_map = 1;
344       seg->update_data = 1;
345 
346       qi_delta = av1_compute_qdelta(rc, avg_q, avg_q * 0.875,
347                                     cm->seq_params->bit_depth);
348       av1_set_segdata(seg, 1, SEG_LVL_ALT_Q, qi_delta - 2);
349       av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_H, -2);
350       av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_V, -2);
351       av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_U, -2);
352       av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_V, -2);
353 
354       av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_H);
355       av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_V);
356       av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_U);
357       av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_V);
358 
359       av1_enable_segfeature(seg, 1, SEG_LVL_ALT_Q);
360     }
361   } else if (seg->enabled) {
362     // All other frames if segmentation has been enabled
363 
364     // First normal frame in a valid gf or alt ref group
365     if (rc->frames_since_golden == 0) {
366       // Set up segment features for normal frames in an arf group
367       // Disable segmentation and clear down features if alt ref
368       // is not active for this group
369 
370       av1_disable_segmentation(seg);
371 
372       memset(cpi->enc_seg.map, 0,
373              cm->mi_params.mi_rows * cm->mi_params.mi_cols);
374 
375       seg->update_map = 0;
376       seg->update_data = 0;
377 
378       av1_clearall_segfeatures(seg);
379     } else if (rc->is_src_frame_alt_ref) {
380       // Special case where we are coding over the top of a previous
381       // alt ref frame.
382       // Segment coding disabled for compred testing
383 
384       // Enable ref frame features for segment 0 as well
385       av1_enable_segfeature(seg, 0, SEG_LVL_REF_FRAME);
386       av1_enable_segfeature(seg, 1, SEG_LVL_REF_FRAME);
387 
388       // All mbs should use ALTREF_FRAME
389       av1_clear_segdata(seg, 0, SEG_LVL_REF_FRAME);
390       av1_set_segdata(seg, 0, SEG_LVL_REF_FRAME, ALTREF_FRAME);
391       av1_clear_segdata(seg, 1, SEG_LVL_REF_FRAME);
392       av1_set_segdata(seg, 1, SEG_LVL_REF_FRAME, ALTREF_FRAME);
393 
394       // Skip all MBs if high Q (0,0 mv and skip coeffs)
395       if (high_q) {
396         av1_enable_segfeature(seg, 0, SEG_LVL_SKIP);
397         av1_enable_segfeature(seg, 1, SEG_LVL_SKIP);
398       }
399       // Enable data update
400       seg->update_data = 1;
401     } else {
402       // All other frames.
403 
404       // No updates.. leave things as they are.
405       seg->update_map = 0;
406       seg->update_data = 0;
407     }
408   }
409 }
410 
av1_apply_active_map(AV1_COMP * cpi)411 void av1_apply_active_map(AV1_COMP *cpi) {
412   struct segmentation *const seg = &cpi->common.seg;
413   unsigned char *const seg_map = cpi->enc_seg.map;
414   const unsigned char *const active_map = cpi->active_map.map;
415   int i;
416 
417   assert(AM_SEGMENT_ID_ACTIVE == CR_SEGMENT_ID_BASE);
418 
419   if (frame_is_intra_only(&cpi->common)) {
420     cpi->active_map.enabled = 0;
421     cpi->active_map.update = 1;
422   }
423 
424   if (cpi->active_map.update) {
425     if (cpi->active_map.enabled) {
426       for (i = 0;
427            i < cpi->common.mi_params.mi_rows * cpi->common.mi_params.mi_cols;
428            ++i)
429         if (seg_map[i] == AM_SEGMENT_ID_ACTIVE) seg_map[i] = active_map[i];
430       av1_enable_segmentation(seg);
431       av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
432       av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
433       av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
434       av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
435       av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
436 
437       av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H,
438                       -MAX_LOOP_FILTER);
439       av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V,
440                       -MAX_LOOP_FILTER);
441       av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U,
442                       -MAX_LOOP_FILTER);
443       av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V,
444                       -MAX_LOOP_FILTER);
445     } else {
446       av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
447       av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
448       av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
449       av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
450       av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
451       if (seg->enabled) {
452         seg->update_data = 1;
453         seg->update_map = 1;
454       }
455     }
456     cpi->active_map.update = 0;
457   }
458 }
459 
460 #if !CONFIG_REALTIME_ONLY
process_tpl_stats_frame(AV1_COMP * cpi)461 static void process_tpl_stats_frame(AV1_COMP *cpi) {
462   const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
463   AV1_COMMON *const cm = &cpi->common;
464 
465   assert(IMPLIES(gf_group->size > 0, cpi->gf_frame_index < gf_group->size));
466 
467   const int tpl_idx = cpi->gf_frame_index;
468   TplParams *const tpl_data = &cpi->ppi->tpl_data;
469   TplDepFrame *tpl_frame = &tpl_data->tpl_frame[tpl_idx];
470   TplDepStats *tpl_stats = tpl_frame->tpl_stats_ptr;
471 
472   if (tpl_frame->is_valid) {
473     int tpl_stride = tpl_frame->stride;
474     int64_t intra_cost_base = 0;
475     int64_t mc_dep_cost_base = 0;
476     const int step = 1 << tpl_data->tpl_stats_block_mis_log2;
477     const int row_step = step;
478     const int col_step_sr =
479         coded_to_superres_mi(step, cm->superres_scale_denominator);
480     const int mi_cols_sr = av1_pixels_to_mi(cm->superres_upscaled_width);
481 
482     for (int row = 0; row < cm->mi_params.mi_rows; row += row_step) {
483       for (int col = 0; col < mi_cols_sr; col += col_step_sr) {
484         TplDepStats *this_stats = &tpl_stats[av1_tpl_ptr_pos(
485             row, col, tpl_stride, tpl_data->tpl_stats_block_mis_log2)];
486         int64_t mc_dep_delta =
487             RDCOST(tpl_frame->base_rdmult, this_stats->mc_dep_rate,
488                    this_stats->mc_dep_dist);
489         intra_cost_base += (this_stats->recrf_dist << RDDIV_BITS);
490         mc_dep_cost_base +=
491             (this_stats->recrf_dist << RDDIV_BITS) + mc_dep_delta;
492       }
493     }
494 
495     if (mc_dep_cost_base == 0) {
496       tpl_frame->is_valid = 0;
497     } else {
498       cpi->rd.r0 = (double)intra_cost_base / mc_dep_cost_base;
499       if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
500         if (cpi->ppi->lap_enabled) {
501           double min_boost_factor = sqrt(cpi->ppi->p_rc.baseline_gf_interval);
502           const int gfu_boost = get_gfu_boost_from_r0_lap(
503               min_boost_factor, MAX_GFUBOOST_FACTOR, cpi->rd.r0,
504               cpi->ppi->p_rc.num_stats_required_for_gfu_boost);
505           // printf("old boost %d new boost %d\n", cpi->rc.gfu_boost,
506           //        gfu_boost);
507           cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
508               min_boost_factor, MAX_BOOST_COMBINE_FACTOR,
509               cpi->ppi->p_rc.gfu_boost, gfu_boost,
510               cpi->ppi->p_rc.num_stats_used_for_gfu_boost);
511         } else {
512           const int gfu_boost = (int)(200.0 / cpi->rd.r0);
513           cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
514               MIN_BOOST_COMBINE_FACTOR, MAX_BOOST_COMBINE_FACTOR,
515               cpi->ppi->p_rc.gfu_boost, gfu_boost, cpi->rc.frames_to_key);
516         }
517       }
518     }
519   }
520 }
521 #endif  // !CONFIG_REALTIME_ONLY
522 
av1_set_size_dependent_vars(AV1_COMP * cpi,int * q,int * bottom_index,int * top_index)523 void av1_set_size_dependent_vars(AV1_COMP *cpi, int *q, int *bottom_index,
524                                  int *top_index) {
525   AV1_COMMON *const cm = &cpi->common;
526 
527   // Setup variables that depend on the dimensions of the frame.
528   av1_set_speed_features_framesize_dependent(cpi, cpi->speed);
529 
530 #if !CONFIG_REALTIME_ONLY
531   GF_GROUP *gf_group = &cpi->ppi->gf_group;
532   if (cpi->oxcf.algo_cfg.enable_tpl_model &&
533       is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
534     process_tpl_stats_frame(cpi);
535     av1_tpl_rdmult_setup(cpi);
536   }
537 #endif
538 
539   // Decide q and q bounds.
540   *q = av1_rc_pick_q_and_bounds(cpi, cm->width, cm->height, cpi->gf_frame_index,
541                                 bottom_index, top_index);
542 
543 #if !CONFIG_REALTIME_ONLY
544   if (cpi->oxcf.rc_cfg.mode == AOM_Q &&
545       cpi->ppi->tpl_data.tpl_frame[cpi->gf_frame_index].is_valid &&
546       is_frame_tpl_eligible(gf_group, cpi->gf_frame_index) &&
547       !is_lossless_requested(&cpi->oxcf.rc_cfg) && !frame_is_intra_only(cm)) {
548     *q = av1_tpl_get_q_index(&cpi->ppi->tpl_data, cpi->gf_frame_index,
549                              cpi->rc.active_worst_quality,
550                              cm->seq_params->bit_depth);
551     *top_index = *bottom_index = *q;
552     if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE)
553       cpi->ppi->p_rc.arf_q = *q;
554   }
555 
556   if (cpi->oxcf.q_cfg.use_fixed_qp_offsets && cpi->oxcf.rc_cfg.mode == AOM_Q) {
557     if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
558       const double qratio_grad =
559           cpi->ppi->p_rc.baseline_gf_interval > 20 ? 0.2 : 0.3;
560       const double qstep_ratio =
561           0.2 +
562           (1.0 - (double)cpi->rc.active_worst_quality / MAXQ) * qratio_grad;
563       *q = av1_get_q_index_from_qstep_ratio(
564           cpi->rc.active_worst_quality, qstep_ratio, cm->seq_params->bit_depth);
565       *top_index = *bottom_index = *q;
566       if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE ||
567           gf_group->update_type[cpi->gf_frame_index] == KF_UPDATE ||
568           gf_group->update_type[cpi->gf_frame_index] == GF_UPDATE)
569         cpi->ppi->p_rc.arf_q = *q;
570     } else if (gf_group->layer_depth[cpi->gf_frame_index] <
571                gf_group->max_layer_depth) {
572       int this_height = gf_group->layer_depth[cpi->gf_frame_index];
573       int arf_q = cpi->ppi->p_rc.arf_q;
574       while (this_height > 1) {
575         arf_q = (arf_q + cpi->oxcf.rc_cfg.cq_level + 1) / 2;
576         --this_height;
577       }
578       *top_index = *bottom_index = *q = arf_q;
579     }
580   }
581 #endif
582 
583   // Configure experimental use of segmentation for enhanced coding of
584   // static regions if indicated.
585   // Only allowed in the second pass of a two pass encode, as it requires
586   // lagged coding, and if the relevant speed feature flag is set.
587   if (is_stat_consumption_stage_twopass(cpi) &&
588       cpi->sf.hl_sf.static_segmentation)
589     configure_static_seg_features(cpi);
590 }
591 
reset_film_grain_chroma_params(aom_film_grain_t * pars)592 static void reset_film_grain_chroma_params(aom_film_grain_t *pars) {
593   pars->num_cr_points = 0;
594   pars->cr_mult = 0;
595   pars->cr_luma_mult = 0;
596   memset(pars->scaling_points_cr, 0, sizeof(pars->scaling_points_cr));
597   memset(pars->ar_coeffs_cr, 0, sizeof(pars->ar_coeffs_cr));
598   pars->num_cb_points = 0;
599   pars->cb_mult = 0;
600   pars->cb_luma_mult = 0;
601   pars->chroma_scaling_from_luma = 0;
602   memset(pars->scaling_points_cb, 0, sizeof(pars->scaling_points_cb));
603   memset(pars->ar_coeffs_cb, 0, sizeof(pars->ar_coeffs_cb));
604 }
605 
av1_update_film_grain_parameters_seq(struct AV1_PRIMARY * ppi,const AV1EncoderConfig * oxcf)606 void av1_update_film_grain_parameters_seq(struct AV1_PRIMARY *ppi,
607                                           const AV1EncoderConfig *oxcf) {
608   SequenceHeader *const seq_params = &ppi->seq_params;
609   const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
610 
611   if (tune_cfg->film_grain_test_vector || tune_cfg->film_grain_table_filename ||
612       tune_cfg->content == AOM_CONTENT_FILM) {
613     seq_params->film_grain_params_present = 1;
614   } else {
615 #if CONFIG_DENOISE
616     seq_params->film_grain_params_present = (oxcf->noise_level > 0);
617 #else
618     seq_params->film_grain_params_present = 0;
619 #endif
620   }
621 }
622 
av1_update_film_grain_parameters(struct AV1_COMP * cpi,const AV1EncoderConfig * oxcf)623 void av1_update_film_grain_parameters(struct AV1_COMP *cpi,
624                                       const AV1EncoderConfig *oxcf) {
625   AV1_COMMON *const cm = &cpi->common;
626   cpi->oxcf = *oxcf;
627   const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
628 
629   if (cpi->film_grain_table) {
630     aom_film_grain_table_free(cpi->film_grain_table);
631     aom_free(cpi->film_grain_table);
632     cpi->film_grain_table = NULL;
633   }
634 
635   if (tune_cfg->film_grain_test_vector) {
636     if (cm->current_frame.frame_type == KEY_FRAME) {
637       memcpy(&cm->film_grain_params,
638              film_grain_test_vectors + tune_cfg->film_grain_test_vector - 1,
639              sizeof(cm->film_grain_params));
640       if (oxcf->tool_cfg.enable_monochrome)
641         reset_film_grain_chroma_params(&cm->film_grain_params);
642       cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
643       if (cm->seq_params->color_range == AOM_CR_FULL_RANGE) {
644         cm->film_grain_params.clip_to_restricted_range = 0;
645       }
646     }
647   } else if (tune_cfg->film_grain_table_filename) {
648     cpi->film_grain_table = aom_malloc(sizeof(*cpi->film_grain_table));
649     memset(cpi->film_grain_table, 0, sizeof(aom_film_grain_table_t));
650 
651     aom_film_grain_table_read(cpi->film_grain_table,
652                               tune_cfg->film_grain_table_filename, cm->error);
653   } else if (tune_cfg->content == AOM_CONTENT_FILM) {
654     cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
655     if (oxcf->tool_cfg.enable_monochrome)
656       reset_film_grain_chroma_params(&cm->film_grain_params);
657     if (cm->seq_params->color_range == AOM_CR_FULL_RANGE)
658       cm->film_grain_params.clip_to_restricted_range = 0;
659   } else {
660     memset(&cm->film_grain_params, 0, sizeof(cm->film_grain_params));
661   }
662 }
663 
av1_scale_references(AV1_COMP * cpi,const InterpFilter filter,const int phase,const int use_optimized_scaler)664 void av1_scale_references(AV1_COMP *cpi, const InterpFilter filter,
665                           const int phase, const int use_optimized_scaler) {
666   AV1_COMMON *cm = &cpi->common;
667   const int num_planes = av1_num_planes(cm);
668   MV_REFERENCE_FRAME ref_frame;
669 
670   for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
671     // Need to convert from AOM_REFFRAME to index into ref_mask (subtract 1).
672     if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) {
673       BufferPool *const pool = cm->buffer_pool;
674       const YV12_BUFFER_CONFIG *const ref =
675           get_ref_frame_yv12_buf(cm, ref_frame);
676 
677       if (ref == NULL) {
678         cpi->scaled_ref_buf[ref_frame - 1] = NULL;
679         continue;
680       }
681 
682       if (ref->y_crop_width != cm->width || ref->y_crop_height != cm->height) {
683         // Replace the reference buffer with a copy having a thicker border,
684         // if the reference buffer is higher resolution than the current
685         // frame, and the border is thin.
686         if ((ref->y_crop_width > cm->width ||
687              ref->y_crop_height > cm->height) &&
688             ref->border < AOM_BORDER_IN_PIXELS) {
689           RefCntBuffer *ref_fb = get_ref_frame_buf(cm, ref_frame);
690           if (aom_yv12_realloc_with_new_border(
691                   &ref_fb->buf, AOM_BORDER_IN_PIXELS,
692                   cm->features.byte_alignment, num_planes) != 0) {
693             aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
694                                "Failed to allocate frame buffer");
695           }
696         }
697         int force_scaling = 0;
698         RefCntBuffer *new_fb = cpi->scaled_ref_buf[ref_frame - 1];
699         if (new_fb == NULL) {
700           const int new_fb_idx = get_free_fb(cm);
701           if (new_fb_idx == INVALID_IDX) {
702             aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
703                                "Unable to find free frame buffer");
704           }
705           force_scaling = 1;
706           new_fb = &pool->frame_bufs[new_fb_idx];
707         }
708 
709         if (force_scaling || new_fb->buf.y_crop_width != cm->width ||
710             new_fb->buf.y_crop_height != cm->height) {
711           if (aom_realloc_frame_buffer(
712                   &new_fb->buf, cm->width, cm->height,
713                   cm->seq_params->subsampling_x, cm->seq_params->subsampling_y,
714                   cm->seq_params->use_highbitdepth, AOM_BORDER_IN_PIXELS,
715                   cm->features.byte_alignment, NULL, NULL, NULL, 0)) {
716             if (force_scaling) {
717               // Release the reference acquired in the get_free_fb() call above.
718               --new_fb->ref_count;
719             }
720             aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
721                                "Failed to allocate frame buffer");
722           }
723 #if CONFIG_AV1_HIGHBITDEPTH
724           if (use_optimized_scaler && cm->seq_params->bit_depth == AOM_BITS_8)
725             av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
726                                         num_planes);
727           else
728             av1_resize_and_extend_frame_nonnormative(
729                 ref, &new_fb->buf, (int)cm->seq_params->bit_depth, num_planes);
730 #else
731           if (use_optimized_scaler)
732             av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
733                                         num_planes);
734           else
735             av1_resize_and_extend_frame_nonnormative(
736                 ref, &new_fb->buf, (int)cm->seq_params->bit_depth, num_planes);
737 #endif
738           cpi->scaled_ref_buf[ref_frame - 1] = new_fb;
739           alloc_frame_mvs(cm, new_fb);
740         }
741       } else {
742         RefCntBuffer *buf = get_ref_frame_buf(cm, ref_frame);
743         buf->buf.y_crop_width = ref->y_crop_width;
744         buf->buf.y_crop_height = ref->y_crop_height;
745         cpi->scaled_ref_buf[ref_frame - 1] = buf;
746         ++buf->ref_count;
747       }
748     } else {
749       if (!has_no_stats_stage(cpi)) cpi->scaled_ref_buf[ref_frame - 1] = NULL;
750     }
751   }
752 }
753 
av1_select_sb_size(const AV1EncoderConfig * const oxcf,int width,int height,int number_spatial_layers)754 BLOCK_SIZE av1_select_sb_size(const AV1EncoderConfig *const oxcf, int width,
755                               int height, int number_spatial_layers) {
756   if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_64X64)
757     return BLOCK_64X64;
758   if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_128X128)
759     return BLOCK_128X128;
760 
761   // Force 64x64 superblock size to increase resolution in perceptual
762   // AQ mode.
763   if (oxcf->mode == ALLINTRA &&
764       (oxcf->q_cfg.deltaq_mode == DELTA_Q_PERCEPTUAL_AI ||
765        oxcf->q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED))
766     return BLOCK_64X64;
767 
768   assert(oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_DYNAMIC);
769 
770   if (number_spatial_layers > 1 ||
771       oxcf->resize_cfg.resize_mode != RESIZE_NONE) {
772     // Use the configured size (top resolution) for spatial layers or
773     // on resize.
774     return AOMMIN(oxcf->frm_dim_cfg.width, oxcf->frm_dim_cfg.height) > 480
775                ? BLOCK_128X128
776                : BLOCK_64X64;
777   }
778 
779   // TODO(any): Possibly could improve this with a heuristic.
780   // When superres / resize is on, 'cm->width / height' can change between
781   // calls, so we don't apply this heuristic there.
782   // Things break if superblock size changes between the first pass and second
783   // pass encoding, which is why this heuristic is not configured as a
784   // speed-feature.
785   if (oxcf->superres_cfg.superres_mode == AOM_SUPERRES_NONE &&
786       oxcf->resize_cfg.resize_mode == RESIZE_NONE &&
787       (oxcf->speed >= 1 || oxcf->mode == REALTIME)) {
788     return AOMMIN(width, height) > 480 ? BLOCK_128X128 : BLOCK_64X64;
789   }
790 
791   return BLOCK_128X128;
792 }
793 
av1_setup_frame(AV1_COMP * cpi)794 void av1_setup_frame(AV1_COMP *cpi) {
795   AV1_COMMON *const cm = &cpi->common;
796   // Set up entropy context depending on frame type. The decoder mandates
797   // the use of the default context, index 0, for keyframes and inter
798   // frames where the error_resilient_mode or intra_only flag is set. For
799   // other inter-frames the encoder currently uses only two contexts;
800   // context 1 for ALTREF frames and context 0 for the others.
801 
802   if (frame_is_intra_only(cm) || cm->features.error_resilient_mode ||
803       cpi->ext_flags.use_primary_ref_none) {
804     av1_setup_past_independence(cm);
805   }
806 
807   if ((cm->current_frame.frame_type == KEY_FRAME && cm->show_frame) ||
808       frame_is_sframe(cm)) {
809     if (!cpi->ppi->seq_params_locked) {
810       set_sb_size(cm->seq_params,
811                   av1_select_sb_size(&cpi->oxcf, cm->width, cm->height,
812                                      cpi->svc.number_spatial_layers));
813     }
814   } else {
815     const RefCntBuffer *const primary_ref_buf = get_primary_ref_frame_buf(cm);
816     if (primary_ref_buf == NULL) {
817       av1_setup_past_independence(cm);
818       cm->seg.update_map = 1;
819       cm->seg.update_data = 1;
820     } else {
821       *cm->fc = primary_ref_buf->frame_context;
822     }
823   }
824 
825   av1_zero(cm->cur_frame->interp_filter_selected);
826   cm->prev_frame = get_primary_ref_frame_buf(cm);
827   cpi->vaq_refresh = 0;
828 }
829 
830 #if !CONFIG_REALTIME_ONLY
get_interp_filter_selected(const AV1_COMMON * const cm,MV_REFERENCE_FRAME ref,InterpFilter ifilter)831 static int get_interp_filter_selected(const AV1_COMMON *const cm,
832                                       MV_REFERENCE_FRAME ref,
833                                       InterpFilter ifilter) {
834   const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref);
835   if (buf == NULL) return 0;
836   return buf->interp_filter_selected[ifilter];
837 }
838 
av1_setup_interp_filter_search_mask(AV1_COMP * cpi)839 uint16_t av1_setup_interp_filter_search_mask(AV1_COMP *cpi) {
840   const AV1_COMMON *const cm = &cpi->common;
841   int ref_total[REF_FRAMES] = { 0 };
842   uint16_t mask = ALLOW_ALL_INTERP_FILT_MASK;
843 
844   if (cpi->last_frame_type == KEY_FRAME || cpi->refresh_frame.alt_ref_frame)
845     return mask;
846 
847   for (MV_REFERENCE_FRAME ref = LAST_FRAME; ref <= ALTREF_FRAME; ++ref) {
848     for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
849          ++ifilter) {
850       ref_total[ref] += get_interp_filter_selected(cm, ref, ifilter);
851     }
852   }
853   int ref_total_total = (ref_total[LAST2_FRAME] + ref_total[LAST3_FRAME] +
854                          ref_total[GOLDEN_FRAME] + ref_total[BWDREF_FRAME] +
855                          ref_total[ALTREF2_FRAME] + ref_total[ALTREF_FRAME]);
856 
857   for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
858        ++ifilter) {
859     int last_score = get_interp_filter_selected(cm, LAST_FRAME, ifilter) * 30;
860     if (ref_total[LAST_FRAME] && last_score <= ref_total[LAST_FRAME]) {
861       int filter_score =
862           get_interp_filter_selected(cm, LAST2_FRAME, ifilter) * 20 +
863           get_interp_filter_selected(cm, LAST3_FRAME, ifilter) * 20 +
864           get_interp_filter_selected(cm, GOLDEN_FRAME, ifilter) * 20 +
865           get_interp_filter_selected(cm, BWDREF_FRAME, ifilter) * 10 +
866           get_interp_filter_selected(cm, ALTREF2_FRAME, ifilter) * 10 +
867           get_interp_filter_selected(cm, ALTREF_FRAME, ifilter) * 10;
868       if (filter_score < ref_total_total) {
869         DUAL_FILTER_TYPE filt_type = ifilter + SWITCHABLE_FILTERS * ifilter;
870         reset_interp_filter_allowed_mask(&mask, filt_type);
871       }
872     }
873   }
874   return mask;
875 }
876 
877 #define STRICT_PSNR_DIFF_THRESH 0.9
878 // Encode key frame with/without screen content tools to determine whether
879 // screen content tools should be enabled for this key frame group or not.
880 // The first encoding is without screen content tools.
881 // The second encoding is with screen content tools.
882 // We compare the psnr and frame size to make the decision.
screen_content_tools_determination(AV1_COMP * cpi,const int allow_screen_content_tools_orig_decision,const int allow_intrabc_orig_decision,const int use_screen_content_tools_orig_decision,const int is_screen_content_type_orig_decision,const int pass,int * projected_size_pass,PSNR_STATS * psnr)883 static void screen_content_tools_determination(
884     AV1_COMP *cpi, const int allow_screen_content_tools_orig_decision,
885     const int allow_intrabc_orig_decision,
886     const int use_screen_content_tools_orig_decision,
887     const int is_screen_content_type_orig_decision, const int pass,
888     int *projected_size_pass, PSNR_STATS *psnr) {
889   AV1_COMMON *const cm = &cpi->common;
890   FeatureFlags *const features = &cm->features;
891   projected_size_pass[pass] = cpi->rc.projected_frame_size;
892 #if CONFIG_AV1_HIGHBITDEPTH
893   const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth;
894   const uint32_t bit_depth = cpi->td.mb.e_mbd.bd;
895   aom_calc_highbd_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass],
896                        bit_depth, in_bit_depth);
897 #else
898   aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass]);
899 #endif
900   if (pass != 1) return;
901 
902   const double psnr_diff = psnr[1].psnr[0] - psnr[0].psnr[0];
903   const int is_sc_encoding_much_better = psnr_diff > STRICT_PSNR_DIFF_THRESH;
904   if (is_sc_encoding_much_better) {
905     // Use screen content tools, if we get coding gain.
906     features->allow_screen_content_tools = 1;
907     features->allow_intrabc = cpi->intrabc_used;
908     cpi->use_screen_content_tools = 1;
909     cpi->is_screen_content_type = 1;
910   } else {
911     // Use original screen content decision.
912     features->allow_screen_content_tools =
913         allow_screen_content_tools_orig_decision;
914     features->allow_intrabc = allow_intrabc_orig_decision;
915     cpi->use_screen_content_tools = use_screen_content_tools_orig_decision;
916     cpi->is_screen_content_type = is_screen_content_type_orig_decision;
917   }
918 }
919 
920 // Set some encoding parameters to make the encoding process fast.
921 // A fixed block partition size, and a large q is used.
set_encoding_params_for_screen_content(AV1_COMP * cpi,const int pass)922 static void set_encoding_params_for_screen_content(AV1_COMP *cpi,
923                                                    const int pass) {
924   AV1_COMMON *const cm = &cpi->common;
925   if (pass == 0) {
926     // In the first pass, encode without screen content tools.
927     // Use a high q, and a fixed block size for fast encoding.
928     cm->features.allow_screen_content_tools = 0;
929     cm->features.allow_intrabc = 0;
930     cpi->use_screen_content_tools = 0;
931     cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
932     cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
933     return;
934   }
935   assert(pass == 1);
936   // In the second pass, encode with screen content tools.
937   // Use a high q, and a fixed block size for fast encoding.
938   cm->features.allow_screen_content_tools = 1;
939   // TODO(chengchen): turn intrabc on could lead to data race issue.
940   // cm->allow_intrabc = 1;
941   cpi->use_screen_content_tools = 1;
942   cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
943   cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
944 }
945 
946 // Determines whether to use screen content tools for the key frame group.
947 // This function modifies "cm->features.allow_screen_content_tools",
948 // "cm->features.allow_intrabc" and "cpi->use_screen_content_tools".
av1_determine_sc_tools_with_encoding(AV1_COMP * cpi,const int q_orig)949 void av1_determine_sc_tools_with_encoding(AV1_COMP *cpi, const int q_orig) {
950   AV1_COMMON *const cm = &cpi->common;
951   const AV1EncoderConfig *const oxcf = &cpi->oxcf;
952   const QuantizationCfg *const q_cfg = &oxcf->q_cfg;
953   // Variables to help determine if we should allow screen content tools.
954   int projected_size_pass[3] = { 0 };
955   PSNR_STATS psnr[3];
956   const int is_key_frame = cm->current_frame.frame_type == KEY_FRAME;
957   const int allow_screen_content_tools_orig_decision =
958       cm->features.allow_screen_content_tools;
959   const int allow_intrabc_orig_decision = cm->features.allow_intrabc;
960   const int use_screen_content_tools_orig_decision =
961       cpi->use_screen_content_tools;
962   const int is_screen_content_type_orig_decision = cpi->is_screen_content_type;
963   // Turn off the encoding trial for forward key frame and superres.
964   if (cpi->sf.rt_sf.use_nonrd_pick_mode || oxcf->kf_cfg.fwd_kf_enabled ||
965       cpi->superres_mode != AOM_SUPERRES_NONE || oxcf->mode == REALTIME ||
966       use_screen_content_tools_orig_decision || !is_key_frame) {
967     return;
968   }
969 
970   // TODO(chengchen): multiple encoding for the lossless mode is time consuming.
971   // Find a better way to determine whether screen content tools should be used
972   // for lossless coding.
973   // Use a high q and a fixed partition to do quick encoding.
974   const int q_for_screen_content_quick_run =
975       is_lossless_requested(&oxcf->rc_cfg) ? q_orig : AOMMAX(q_orig, 244);
976   const int partition_search_type_orig = cpi->sf.part_sf.partition_search_type;
977   const BLOCK_SIZE fixed_partition_block_size_orig =
978       cpi->sf.part_sf.fixed_partition_size;
979 
980   // Setup necessary params for encoding, including frame source, etc.
981 
982   cpi->source =
983       av1_scale_if_required(cm, cpi->unscaled_source, &cpi->scaled_source,
984                             cm->features.interp_filter, 0, false, false);
985   if (cpi->unscaled_last_source != NULL) {
986     cpi->last_source = av1_scale_if_required(
987         cm, cpi->unscaled_last_source, &cpi->scaled_last_source,
988         cm->features.interp_filter, 0, false, false);
989   }
990 
991   av1_setup_frame(cpi);
992 
993   if (cm->seg.enabled) {
994     if (!cm->seg.update_data && cm->prev_frame) {
995       segfeatures_copy(&cm->seg, &cm->prev_frame->seg);
996       cm->seg.enabled = cm->prev_frame->seg.enabled;
997     } else {
998       av1_calculate_segdata(&cm->seg);
999     }
1000   } else {
1001     memset(&cm->seg, 0, sizeof(cm->seg));
1002   }
1003   segfeatures_copy(&cm->cur_frame->seg, &cm->seg);
1004   cm->cur_frame->seg.enabled = cm->seg.enabled;
1005 
1006   // The two encoding passes aim to help determine whether to use screen
1007   // content tools, with a high q and fixed partition.
1008   for (int pass = 0; pass < 2; ++pass) {
1009     set_encoding_params_for_screen_content(cpi, pass);
1010     av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel,
1011                       q_for_screen_content_quick_run,
1012                       q_cfg->enable_chroma_deltaq);
1013     av1_set_speed_features_qindex_dependent(cpi, oxcf->speed);
1014     if (q_cfg->deltaq_mode != NO_DELTA_Q || q_cfg->enable_chroma_deltaq)
1015       av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
1016                          cm->seq_params->bit_depth);
1017 
1018     av1_set_variance_partition_thresholds(cpi, q_for_screen_content_quick_run,
1019                                           0);
1020     // transform / motion compensation build reconstruction frame
1021     av1_encode_frame(cpi);
1022     // Screen content decision
1023     screen_content_tools_determination(
1024         cpi, allow_screen_content_tools_orig_decision,
1025         allow_intrabc_orig_decision, use_screen_content_tools_orig_decision,
1026         is_screen_content_type_orig_decision, pass, projected_size_pass, psnr);
1027   }
1028 
1029   // Set partition speed feature back.
1030   cpi->sf.part_sf.partition_search_type = partition_search_type_orig;
1031   cpi->sf.part_sf.fixed_partition_size = fixed_partition_block_size_orig;
1032 }
1033 #endif  // CONFIG_REALTIME_ONLY
1034 
fix_interp_filter(InterpFilter * const interp_filter,const FRAME_COUNTS * const counts)1035 static void fix_interp_filter(InterpFilter *const interp_filter,
1036                               const FRAME_COUNTS *const counts) {
1037   if (*interp_filter == SWITCHABLE) {
1038     // Check to see if only one of the filters is actually used
1039     int count[SWITCHABLE_FILTERS] = { 0 };
1040     int num_filters_used = 0;
1041     for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1042       for (int j = 0; j < SWITCHABLE_FILTER_CONTEXTS; ++j)
1043         count[i] += counts->switchable_interp[j][i];
1044       num_filters_used += (count[i] > 0);
1045     }
1046     if (num_filters_used == 1) {
1047       // Only one filter is used. So set the filter at frame level
1048       for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1049         if (count[i]) {
1050           if (i == EIGHTTAP_REGULAR) *interp_filter = i;
1051           break;
1052         }
1053       }
1054     }
1055   }
1056 }
1057 
av1_finalize_encoded_frame(AV1_COMP * const cpi)1058 void av1_finalize_encoded_frame(AV1_COMP *const cpi) {
1059   AV1_COMMON *const cm = &cpi->common;
1060   CurrentFrame *const current_frame = &cm->current_frame;
1061 
1062   if (!cm->seq_params->reduced_still_picture_hdr &&
1063       encode_show_existing_frame(cm)) {
1064     RefCntBuffer *const frame_to_show =
1065         cm->ref_frame_map[cpi->existing_fb_idx_to_show];
1066 
1067     if (frame_to_show == NULL) {
1068       aom_internal_error(cm->error, AOM_CODEC_UNSUP_BITSTREAM,
1069                          "Buffer does not contain a reconstructed frame");
1070     }
1071     assert(frame_to_show->ref_count > 0);
1072     assign_frame_buffer_p(&cm->cur_frame, frame_to_show);
1073   }
1074 
1075   if (!encode_show_existing_frame(cm) &&
1076       cm->seq_params->film_grain_params_present &&
1077       (cm->show_frame || cm->showable_frame)) {
1078     // Copy the current frame's film grain params to the its corresponding
1079     // RefCntBuffer slot.
1080     cm->cur_frame->film_grain_params = cm->film_grain_params;
1081 
1082     // We must update the parameters if this is not an INTER_FRAME
1083     if (current_frame->frame_type != INTER_FRAME)
1084       cm->cur_frame->film_grain_params.update_parameters = 1;
1085 
1086     // Iterate the random seed for the next frame.
1087     cm->film_grain_params.random_seed += 3381;
1088     if (cm->film_grain_params.random_seed == 0)
1089       cm->film_grain_params.random_seed = 7391;
1090   }
1091 
1092   // Initialise all tiles' contexts from the global frame context
1093   for (int tile_col = 0; tile_col < cm->tiles.cols; tile_col++) {
1094     for (int tile_row = 0; tile_row < cm->tiles.rows; tile_row++) {
1095       const int tile_idx = tile_row * cm->tiles.cols + tile_col;
1096       cpi->tile_data[tile_idx].tctx = *cm->fc;
1097     }
1098   }
1099 
1100   fix_interp_filter(&cm->features.interp_filter, cpi->td.counts);
1101 }
1102 
av1_is_integer_mv(const YV12_BUFFER_CONFIG * cur_picture,const YV12_BUFFER_CONFIG * last_picture,ForceIntegerMVInfo * const force_intpel_info)1103 int av1_is_integer_mv(const YV12_BUFFER_CONFIG *cur_picture,
1104                       const YV12_BUFFER_CONFIG *last_picture,
1105                       ForceIntegerMVInfo *const force_intpel_info) {
1106   // check use hash ME
1107   int k;
1108 
1109   const int block_size = FORCE_INT_MV_DECISION_BLOCK_SIZE;
1110   const double threshold_current = 0.8;
1111   const double threshold_average = 0.95;
1112   const int max_history_size = 32;
1113   int T = 0;  // total block
1114   int C = 0;  // match with collocated block
1115   int S = 0;  // smooth region but not match with collocated block
1116 
1117   const int pic_width = cur_picture->y_width;
1118   const int pic_height = cur_picture->y_height;
1119   for (int i = 0; i + block_size <= pic_height; i += block_size) {
1120     for (int j = 0; j + block_size <= pic_width; j += block_size) {
1121       const int x_pos = j;
1122       const int y_pos = i;
1123       int match = 1;
1124       T++;
1125 
1126       // check whether collocated block match with current
1127       uint8_t *p_cur = cur_picture->y_buffer;
1128       uint8_t *p_ref = last_picture->y_buffer;
1129       int stride_cur = cur_picture->y_stride;
1130       int stride_ref = last_picture->y_stride;
1131       p_cur += (y_pos * stride_cur + x_pos);
1132       p_ref += (y_pos * stride_ref + x_pos);
1133 
1134       if (cur_picture->flags & YV12_FLAG_HIGHBITDEPTH) {
1135         uint16_t *p16_cur = CONVERT_TO_SHORTPTR(p_cur);
1136         uint16_t *p16_ref = CONVERT_TO_SHORTPTR(p_ref);
1137         for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1138           for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1139             if (p16_cur[tmpX] != p16_ref[tmpX]) {
1140               match = 0;
1141             }
1142           }
1143           p16_cur += stride_cur;
1144           p16_ref += stride_ref;
1145         }
1146       } else {
1147         for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1148           for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1149             if (p_cur[tmpX] != p_ref[tmpX]) {
1150               match = 0;
1151             }
1152           }
1153           p_cur += stride_cur;
1154           p_ref += stride_ref;
1155         }
1156       }
1157 
1158       if (match) {
1159         C++;
1160         continue;
1161       }
1162 
1163       if (av1_hash_is_horizontal_perfect(cur_picture, block_size, x_pos,
1164                                          y_pos) ||
1165           av1_hash_is_vertical_perfect(cur_picture, block_size, x_pos, y_pos)) {
1166         S++;
1167         continue;
1168       }
1169     }
1170   }
1171 
1172   assert(T > 0);
1173   double cs_rate = ((double)(C + S)) / ((double)(T));
1174 
1175   force_intpel_info->cs_rate_array[force_intpel_info->rate_index] = cs_rate;
1176 
1177   force_intpel_info->rate_index =
1178       (force_intpel_info->rate_index + 1) % max_history_size;
1179   force_intpel_info->rate_size++;
1180   force_intpel_info->rate_size =
1181       AOMMIN(force_intpel_info->rate_size, max_history_size);
1182 
1183   if (cs_rate < threshold_current) {
1184     return 0;
1185   }
1186 
1187   if (C == T) {
1188     return 1;
1189   }
1190 
1191   double cs_average = 0.0;
1192 
1193   for (k = 0; k < force_intpel_info->rate_size; k++) {
1194     cs_average += force_intpel_info->cs_rate_array[k];
1195   }
1196   cs_average /= force_intpel_info->rate_size;
1197 
1198   if (cs_average < threshold_average) {
1199     return 0;
1200   }
1201 
1202   if ((T - C - S) < 0) {
1203     return 1;
1204   }
1205 
1206   if (cs_average > 1.01) {
1207     return 1;
1208   }
1209 
1210   return 0;
1211 }
1212 
av1_set_mb_ssim_rdmult_scaling(AV1_COMP * cpi)1213 void av1_set_mb_ssim_rdmult_scaling(AV1_COMP *cpi) {
1214   const CommonModeInfoParams *const mi_params = &cpi->common.mi_params;
1215   ThreadData *td = &cpi->td;
1216   MACROBLOCK *x = &td->mb;
1217   MACROBLOCKD *xd = &x->e_mbd;
1218   uint8_t *y_buffer = cpi->source->y_buffer;
1219   const int y_stride = cpi->source->y_stride;
1220   const int block_size = BLOCK_16X16;
1221 
1222   const int num_mi_w = mi_size_wide[block_size];
1223   const int num_mi_h = mi_size_high[block_size];
1224   const int num_cols = (mi_params->mi_cols + num_mi_w - 1) / num_mi_w;
1225   const int num_rows = (mi_params->mi_rows + num_mi_h - 1) / num_mi_h;
1226   double log_sum = 0.0;
1227   const int use_hbd = cpi->source->flags & YV12_FLAG_HIGHBITDEPTH;
1228 
1229   // Loop through each 16x16 block.
1230   for (int row = 0; row < num_rows; ++row) {
1231     for (int col = 0; col < num_cols; ++col) {
1232       double var = 0.0, num_of_var = 0.0;
1233       const int index = row * num_cols + col;
1234 
1235       // Loop through each 8x8 block.
1236       for (int mi_row = row * num_mi_h;
1237            mi_row < mi_params->mi_rows && mi_row < (row + 1) * num_mi_h;
1238            mi_row += 2) {
1239         for (int mi_col = col * num_mi_w;
1240              mi_col < mi_params->mi_cols && mi_col < (col + 1) * num_mi_w;
1241              mi_col += 2) {
1242           struct buf_2d buf;
1243           const int row_offset_y = mi_row << 2;
1244           const int col_offset_y = mi_col << 2;
1245 
1246           buf.buf = y_buffer + row_offset_y * y_stride + col_offset_y;
1247           buf.stride = y_stride;
1248 
1249           if (use_hbd) {
1250             var += av1_high_get_sby_perpixel_variance(cpi, &buf, BLOCK_8X8,
1251                                                       xd->bd);
1252           } else {
1253             var += av1_get_sby_perpixel_variance(cpi, &buf, BLOCK_8X8);
1254           }
1255 
1256           num_of_var += 1.0;
1257         }
1258       }
1259       var = var / num_of_var;
1260 
1261       // Curve fitting with an exponential model on all 16x16 blocks from the
1262       // midres dataset.
1263       var = 67.035434 * (1 - exp(-0.0021489 * var)) + 17.492222;
1264       cpi->ssim_rdmult_scaling_factors[index] = var;
1265       log_sum += log(var);
1266     }
1267   }
1268   log_sum = exp(log_sum / (double)(num_rows * num_cols));
1269 
1270   for (int row = 0; row < num_rows; ++row) {
1271     for (int col = 0; col < num_cols; ++col) {
1272       const int index = row * num_cols + col;
1273       cpi->ssim_rdmult_scaling_factors[index] /= log_sum;
1274     }
1275   }
1276 }
1277 
1278 // Coding context that only needs to be saved when recode loop includes
1279 // filtering (deblocking, CDEF, superres post-encode upscale and/or loop
1280 // restoraton).
save_extra_coding_context(AV1_COMP * cpi)1281 static void save_extra_coding_context(AV1_COMP *cpi) {
1282   CODING_CONTEXT *const cc = &cpi->coding_context;
1283   AV1_COMMON *cm = &cpi->common;
1284 
1285   cc->lf = cm->lf;
1286   cc->cdef_info = cm->cdef_info;
1287   cc->rc = cpi->rc;
1288   cc->mv_stats = cpi->ppi->mv_stats;
1289 }
1290 
av1_save_all_coding_context(AV1_COMP * cpi)1291 void av1_save_all_coding_context(AV1_COMP *cpi) {
1292   save_extra_coding_context(cpi);
1293   if (!frame_is_intra_only(&cpi->common)) release_scaled_references(cpi);
1294 }
1295 
1296 #if DUMP_RECON_FRAMES == 1
1297 
1298 // NOTE(zoeliu): For debug - Output the filtered reconstructed video.
av1_dump_filtered_recon_frames(AV1_COMP * cpi)1299 void av1_dump_filtered_recon_frames(AV1_COMP *cpi) {
1300   AV1_COMMON *const cm = &cpi->common;
1301   const CurrentFrame *const current_frame = &cm->current_frame;
1302   const YV12_BUFFER_CONFIG *recon_buf = &cm->cur_frame->buf;
1303 
1304   if (recon_buf == NULL) {
1305     printf("Frame %d is not ready.\n", current_frame->frame_number);
1306     return;
1307   }
1308 
1309   static const int flag_list[REF_FRAMES] = { 0,
1310                                              AOM_LAST_FLAG,
1311                                              AOM_LAST2_FLAG,
1312                                              AOM_LAST3_FLAG,
1313                                              AOM_GOLD_FLAG,
1314                                              AOM_BWD_FLAG,
1315                                              AOM_ALT2_FLAG,
1316                                              AOM_ALT_FLAG };
1317   printf(
1318       "\n***Frame=%d (frame_offset=%d, show_frame=%d, "
1319       "show_existing_frame=%d) "
1320       "[LAST LAST2 LAST3 GOLDEN BWD ALT2 ALT]=[",
1321       current_frame->frame_number, current_frame->order_hint, cm->show_frame,
1322       cm->show_existing_frame);
1323   for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
1324     const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
1325     const int ref_offset = buf != NULL ? (int)buf->order_hint : -1;
1326     printf(" %d(%c)", ref_offset,
1327            (cpi->ref_frame_flags & flag_list[ref_frame]) ? 'Y' : 'N');
1328   }
1329   printf(" ]\n");
1330 
1331   if (!cm->show_frame) {
1332     printf("Frame %d is a no show frame, so no image dump.\n",
1333            current_frame->frame_number);
1334     return;
1335   }
1336 
1337   int h;
1338   char file_name[256] = "/tmp/enc_filtered_recon.yuv";
1339   FILE *f_recon = NULL;
1340 
1341   if (current_frame->frame_number == 0) {
1342     if ((f_recon = fopen(file_name, "wb")) == NULL) {
1343       printf("Unable to open file %s to write.\n", file_name);
1344       return;
1345     }
1346   } else {
1347     if ((f_recon = fopen(file_name, "ab")) == NULL) {
1348       printf("Unable to open file %s to append.\n", file_name);
1349       return;
1350     }
1351   }
1352   printf(
1353       "\nFrame=%5d, encode_update_type[%5d]=%1d, frame_offset=%d, "
1354       "show_frame=%d, show_existing_frame=%d, source_alt_ref_active=%d, "
1355       "refresh_alt_ref_frame=%d, "
1356       "y_stride=%4d, uv_stride=%4d, cm->width=%4d, cm->height=%4d\n\n",
1357       current_frame->frame_number, cpi->gf_frame_index,
1358       cpi->ppi->gf_group.update_type[cpi->gf_frame_index],
1359       current_frame->order_hint, cm->show_frame, cm->show_existing_frame,
1360       cpi->rc.source_alt_ref_active, cpi->refresh_frame.alt_ref_frame,
1361       recon_buf->y_stride, recon_buf->uv_stride, cm->width, cm->height);
1362 #if 0
1363   int ref_frame;
1364   printf("get_ref_frame_map_idx: [");
1365   for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame)
1366     printf(" %d", get_ref_frame_map_idx(cm, ref_frame));
1367   printf(" ]\n");
1368 #endif  // 0
1369 
1370   // --- Y ---
1371   for (h = 0; h < cm->height; ++h) {
1372     fwrite(&recon_buf->y_buffer[h * recon_buf->y_stride], 1, cm->width,
1373            f_recon);
1374   }
1375   // --- U ---
1376   for (h = 0; h < (cm->height >> 1); ++h) {
1377     fwrite(&recon_buf->u_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1378            f_recon);
1379   }
1380   // --- V ---
1381   for (h = 0; h < (cm->height >> 1); ++h) {
1382     fwrite(&recon_buf->v_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1383            f_recon);
1384   }
1385 
1386   fclose(f_recon);
1387 }
1388 #endif  // DUMP_RECON_FRAMES
1389