• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright Samsung Electronics Co.,LTD.
3  * Copyright (C) 2017 The Android Open Source Project
4  *
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 #define ATRACE_TAG (ATRACE_TAG_GRAPHICS | ATRACE_TAG_HAL)
19 
20 #include "acrylic_g2d.h"
21 
22 #include <alloca.h>
23 #include <exynos_format.h> // hardware/smasung_slsi/exynos/include
24 #include <hardware/hwcomposer2.h>
25 #include <log/log.h>
26 #include <mali_gralloc_formats.h>
27 #include <sys/ioctl.h>
28 #include <system/graphics.h>
29 #include <utils/Trace.h>
30 
31 #include <algorithm>
32 #include <cstring>
33 
34 enum {
35     G2D_CSC_STD_UNDEFINED = -1,
36     G2D_CSC_STD_601       = 0,
37     G2D_CSC_STD_709       = 1,
38     G2D_CSC_STD_2020      = 2,
39     G2D_CSC_STD_P3        = 3,
40 
41     G2D_CSC_STD_COUNT     = 4,
42 };
43 
44 enum {
45     G2D_CSC_RANGE_LIMITED,
46     G2D_CSC_RANGE_FULL,
47 
48     G2D_CSC_RANGE_COUNT,
49 };
50 
51 static char csc_std_to_matrix_index[] = {
52     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_UNSPECIFIED
53     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_BT709
54     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_625
55     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_625_UNADJUSTED
56     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_525
57     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_525_UNADJUSTED
58     G2D_CSC_STD_2020,                         // HAL_DATASPACE_STANDARD_BT2020
59     G2D_CSC_STD_2020,                         // HAL_DATASPACE_STANDARD_BT2020_CONSTANT_LUMINANCE
60     static_cast<char>(G2D_CSC_STD_UNDEFINED), // HAL_DATASPACE_STANDARD_BT470M
61     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_FILM
62     G2D_CSC_STD_P3,                           // HAL_DATASPACE_STANDARD_DCI_P3
63     static_cast<char>(G2D_CSC_STD_UNDEFINED), // HAL_DATASPACE_STANDARD_ADOBE_RGB
64 };
65 
66 static uint16_t YCbCr2sRGBCoefficients[G2D_CSC_STD_COUNT * G2D_CSC_RANGE_COUNT][9] = {
67     {0x0254, 0x0000, 0x0331, 0x0254, 0xFF37, 0xFE60, 0x0254, 0x0409, 0x0000}, // 601 limited
68     {0x0200, 0x0000, 0x02BE, 0x0200, 0xFF54, 0xFE9B, 0x0200, 0x0377, 0x0000}, // 601 full
69     {0x0254, 0x0000, 0x0396, 0x0254, 0xFF93, 0xFEEF, 0x0254, 0x043A, 0x0000}, // 709 limited
70     {0x0200, 0x0000, 0x0314, 0x0200, 0xFFA2, 0xFF16, 0x0200, 0x03A1, 0x0000}, // 709 full
71     {0x0254, 0x0000, 0x035B, 0x0254, 0xFFA0, 0xFEB3, 0x0254, 0x0449, 0x0000}, // 2020 limited
72     {0x0200, 0x0000, 0x02E2, 0x0200, 0xFFAE, 0xFEE2, 0x0200, 0x03AE, 0x0000}, // 2020 full
73     {0x0254, 0x0000, 0x03AE, 0x0254, 0xFF96, 0xFEEE, 0x0254, 0x0456, 0x0000}, // DCI-P3 limited
74     {0x0200, 0x0000, 0x0329, 0x0200, 0xFFA5, 0xFF15, 0x0200, 0x03B9, 0x0000}, // DCI-P3 full
75 };
76 
77 static uint16_t sRGB2YCbCrCoefficients[G2D_CSC_STD_COUNT * G2D_CSC_RANGE_COUNT][9] = {
78     {0x0083, 0x0102, 0x0032, 0xFFB4, 0xFF6B, 0x00E1, 0x00E1, 0xFF44, 0xFFDB}, // 601 limited
79     {0x0099, 0x012D, 0x003A, 0xFFA8, 0xFF53, 0x0106, 0x0106, 0xFF25, 0xFFD5}, // 601 full
80     {0x005D, 0x013A, 0x0020, 0xFFCC, 0xFF53, 0x00E1, 0x00E1, 0xFF34, 0xFFEB}, // 709 limited
81     {0x006D, 0x016E, 0x0025, 0xFFC4, 0xFF36, 0x0106, 0x0106, 0xFF12, 0xFFE8}, // 709 full
82     {0x0074, 0x012A, 0x001A, 0xFFC1, 0xFF5A, 0x00E1, 0x00E1, 0xFF31, 0xFFEE}, // 2020 limited
83     {0x0087, 0x015B, 0x001E, 0xFFB7, 0xFF43, 0x0106, 0x0106, 0xFF0F, 0xFFEB}, // 2020 full
84     {0x006B, 0x0171, 0x0023, 0xFFC6, 0xFF3A, 0x0100, 0x0100, 0xFF16, 0xFFEA}, // DCI-P3 limited(full)
85     {0x006B, 0x0171, 0x0023, 0xFFC6, 0xFF3A, 0x0100, 0x0100, 0xFF16, 0xFFEA}, // DCI-P3 full
86 };
87 
88 #define CSC_MATRIX_REGISTER_COUNT 9
89 #define CSC_MATRIX_REGISTER_SIZE  (CSC_MATRIX_REGISTER_COUNT * sizeof(uint32_t))
90 
g2dfmt_is_ycbcr(unsigned int g2dfmt)91 static inline bool g2dfmt_is_ycbcr(unsigned int g2dfmt)
92 {
93     g2dfmt &= G2D_DATAFMT_MASK;
94     return (G2D_DATAFMT_YUV_MIN <= g2dfmt) && (g2dfmt <= G2D_DATAFMT_YUV_MAX);
95 }
96 
97 class CSCMatrixWriter {
98     enum { CSC_MATRIX_MAX_COUNT = 4, CSC_MATRIX_INVALID_INDEX = 200 };
99     enum { CSC_MATRIX_SRC_BASE = 0x2000, CSC_MATRIX_DST_BASE = 0x2100 };
100 public:
CSCMatrixWriter(unsigned int g2dfmt,unsigned int dataspace,uint32_t * command)101     CSCMatrixWriter(unsigned int g2dfmt, unsigned int dataspace, uint32_t *command)
102                     : mMatrixCount(0), mMatrixTargetIndex(CSC_MATRIX_INVALID_INDEX) {
103         // Ignore if unsupported dataspace is specified.
104         // G2D also works for the case.
105         // But the correctness of the result is not guaranteed.
106         if (g2dfmt_is_ycbcr(g2dfmt)) {
107             mMatrixTargetIndex = findMatrixIndex(dataspace);
108             if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
109                 *command = G2D_LAYER_YCBCRMODE_WIDE;
110         }
111     }
112 
configure(unsigned int g2dfmt,unsigned int dataspace,uint32_t * command)113     bool configure(unsigned int g2dfmt, unsigned int dataspace, uint32_t *command) {
114         if (!g2dfmt_is_ycbcr(g2dfmt))
115             return true;
116 
117         unsigned int spcidx = findMatrixIndex(dataspace);
118 
119         if (spcidx == CSC_MATRIX_INVALID_INDEX)
120             return false;
121 
122         if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
123             *command = G2D_LAYER_YCBCRMODE_WIDE;
124 
125         for (int i = 0; i < mMatrixCount; i++) {
126             if (mMatrixIndex[i] == spcidx) {
127                 *command |= i;
128                 return true;
129             }
130         }
131 
132         if (mMatrixCount == CSC_MATRIX_MAX_COUNT) {
133             ALOGE("Too many CSC requirements");
134             return false;
135         }
136 
137         mMatrixIndex[mMatrixCount] = spcidx;
138 
139         *command |= mMatrixCount++;
140 
141         return true;
142     }
143 
getRegisterCount()144     unsigned int getRegisterCount() {
145         unsigned int count = CSC_MATRIX_REGISTER_COUNT * mMatrixCount;
146         if (mMatrixTargetIndex != CSC_MATRIX_INVALID_INDEX)
147             count += CSC_MATRIX_REGISTER_COUNT;
148         return count;
149     }
150 
write(g2d_reg regs[])151     unsigned int write(g2d_reg regs[]) {
152         unsigned int count = 0;
153 
154         if (mMatrixTargetIndex != CSC_MATRIX_INVALID_INDEX) {
155             writeSingle(CSC_MATRIX_DST_BASE,
156                         &regs[count], sRGB2YCbCrCoefficients[mMatrixTargetIndex]);
157             count += CSC_MATRIX_REGISTER_COUNT;
158         }
159 
160         for (int m = 0; m < mMatrixCount; m++) {
161             writeSingle(CSC_MATRIX_SRC_BASE + m * CSC_MATRIX_REGISTER_SIZE,
162                         &regs[count], YCbCr2sRGBCoefficients[mMatrixIndex[m]]);
163             count += CSC_MATRIX_REGISTER_COUNT;
164         }
165 
166         return count;
167     }
168 
169 private:
writeSingle(unsigned int base,g2d_reg regs[],uint16_t matrix[9])170     void writeSingle(unsigned int base, g2d_reg regs[], uint16_t matrix[9]) {
171         for (unsigned int idx = 0; idx < CSC_MATRIX_REGISTER_COUNT; idx++) {
172             regs[idx].offset = base;
173             regs[idx].value = matrix[idx];
174             base += sizeof(uint32_t);
175         }
176     }
177 
findMatrixIndex(unsigned int dataspace)178     unsigned int findMatrixIndex(unsigned int dataspace) {
179         unsigned int index, colorspace;
180 
181         colorspace = (dataspace & HAL_DATASPACE_STANDARD_MASK) >> HAL_DATASPACE_STANDARD_SHIFT;
182         if (colorspace >= ARRSIZE(csc_std_to_matrix_index)) {
183             ALOGE("Data space %d is not supported by G2D", dataspace);
184             return CSC_MATRIX_INVALID_INDEX;
185         }
186 
187         index = csc_std_to_matrix_index[colorspace] * G2D_CSC_RANGE_COUNT;
188         if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
189             index++;
190 
191         return index;
192     }
193 
194     unsigned int mMatrixIndex[CSC_MATRIX_MAX_COUNT];
195     int mMatrixCount;
196     unsigned int mMatrixTargetIndex;
197 };
198 
199 #define G2D_FILTER_COEF_BASE 0x6000
200 #define G2D_FILTER_COEF_REG(idx) (0x6000 + (idx) * 0x400)
201 #define G2D_FILTER_C_OFFSET 0x200
202 #define G2D_SCALE_FACTOR(from, to) ((static_cast<uint32_t>(from) << G2D_SCALEFACTOR_FRACBITS) / (to))
203 
204 #define SI11(v)                              static_cast<uint32_t>((v) & 0x7FF)
205 #define FILTER_HCOEF(a, b, c, d, e, f, g, h) {SI11(a), SI11(b), SI11(c), SI11(d), SI11(e), SI11(f), SI11(g), SI11(h)}
206 #define FILTER_VCOEF(a, b, c, d)             {SI11(a), SI11(b), SI11(c), SI11(d)}
207 
208 #define NUM_HORI_COEFFICIENTS 8
209 #define NUM_VERT_COEFFICIENTS 4
210 #define NUM_FILTER_PHASE 9
211 #define NUM_FILTER_COEF_SETS 7
212 
213 #define NUM_VERT_COEF_REGS (NUM_FILTER_PHASE * NUM_VERT_COEFFICIENTS)
214 #define NUM_HORI_COEF_REGS (NUM_FILTER_PHASE * NUM_HORI_COEFFICIENTS)
215 
216 static uint32_t g2dHoriFilterCoef[NUM_FILTER_COEF_SETS][NUM_FILTER_PHASE][NUM_HORI_COEFFICIENTS] = {
217     { // Upsampling
218         FILTER_HCOEF(   0,   0,   0, 512,   0,   0,   0,   0), FILTER_HCOEF(  -2,   8, -25, 509,  30,  -9,   2,  -1), FILTER_HCOEF(  -4,  14, -46, 499,  64, -19,   5,  -1),
219         FILTER_HCOEF(  -5,  20, -62, 482, 101, -30,   8,  -2), FILTER_HCOEF(  -5,  23, -73, 458, 142, -41,  12,  -3), FILTER_HCOEF(  -6,  25, -80, 429, 185, -53,  15,  -3),
220         FILTER_HCOEF(  -6,  26, -83, 395, 228, -63,  19,  -4), FILTER_HCOEF(  -6,  25, -82, 357, 273, -71,  21,  -5), FILTER_HCOEF(  -5,  23, -78, 316, 316, -78,  23,  -5),
221     }, { // x7/8 Downsampling
222         FILTER_HCOEF(  12, -32,  56, 444,  52, -32,  12,   0), FILTER_HCOEF(   9, -24,  29, 445,  82, -39,  13,  -3), FILTER_HCOEF(   7, -16,   6, 438, 112, -46,  14,  -3),
223         FILTER_HCOEF(   5,  -9, -14, 426, 144, -52,  15,  -3), FILTER_HCOEF(   3,  -3, -30, 410, 177, -58,  16,  -3), FILTER_HCOEF(   2,   2, -43, 390, 211, -63,  16,  -3),
224         FILTER_HCOEF(   1,   7, -53, 365, 244, -66,  16,  -2), FILTER_HCOEF(   0,  10, -60, 338, 277, -66,  15,  -2), FILTER_HCOEF(  -1,  13, -65, 309, 309, -65,  13,  -1),
225     }, { // x6/8 Downsampling
226         FILTER_HCOEF(   8, -44, 100, 384, 100, -44,   8,   0), FILTER_HCOEF(   9, -40,  77, 382, 123, -47,   8,   0), FILTER_HCOEF(   8, -36,  57, 377, 147, -49,   7,   1),
227         FILTER_HCOEF(   8, -32,  38, 369, 171, -49,   5,   2), FILTER_HCOEF(   8, -27,  20, 358, 196, -48,   3,   2), FILTER_HCOEF(   7, -22,   5, 344, 221, -47,   1,   3),
228         FILTER_HCOEF(   7, -18,  -9, 329, 245, -43,  -2,   3), FILTER_HCOEF(   5, -13, -20, 310, 268, -37,  -5,   4), FILTER_HCOEF(   5,  -9, -30, 290, 290, -30,  -9,   5),
229     }, { // x5/8 Downsampling
230         FILTER_HCOEF(  -3, -31, 130, 320, 130, -31,  -3,   0), FILTER_HCOEF(  -3, -32, 113, 319, 147, -29,  -6,   3), FILTER_HCOEF(  -1, -33,  97, 315, 165, -26,  -8,   3),
231         FILTER_HCOEF(   0, -32,  81, 311, 182, -22, -11,   3), FILTER_HCOEF(   1, -31,  66, 304, 199, -17, -13,   3), FILTER_HCOEF(   2, -30,  52, 296, 216, -11, -16,   3),
232         FILTER_HCOEF(   2, -28,  38, 286, 232,  -3, -18,   3), FILTER_HCOEF(   3, -25,  26, 274, 247,   5, -21,   3), FILTER_HCOEF(   3, -23,  15, 261, 261,  15, -23,   3),
233     }, { // x4/8 Downsampling
234         FILTER_HCOEF( -11,   0, 140, 255, 140,   0, -12,   0), FILTER_HCOEF( -10,  -4, 129, 254, 151,   5, -13,   0), FILTER_HCOEF(  -9,  -7, 117, 253, 163,  10, -14,  -1),
235         FILTER_HCOEF(  -8, -10, 106, 250, 174,  16, -15,  -1), FILTER_HCOEF(  -7, -12,  95, 246, 185,  22, -16,  -1), FILTER_HCOEF(  -6, -14,  85, 241, 195,  29, -16,  -2),
236         FILTER_HCOEF(  -5, -15,  74, 236, 204,  37, -17,  -2), FILTER_HCOEF(  -5, -16,  64, 229, 214,  46, -17,  -3), FILTER_HCOEF(  -4, -17,  55, 222, 222,  55, -17,  -4),
237     }, { // x3/8 Downsampling
238         FILTER_HCOEF(  -5,  31, 133, 195, 133,  31,  -6,   0), FILTER_HCOEF(  -5,  27, 126, 195, 139,  37,  -4,  -3), FILTER_HCOEF(  -5,  23, 119, 194, 146,  41,  -3,  -3),
239         FILTER_HCOEF(  -5,  19, 112, 193, 152,  47,  -2,  -4), FILTER_HCOEF(  -5,  16, 105, 191, 158,  53,  -2,  -4), FILTER_HCOEF(  -5,  12,  98, 189, 163,  59,   0,  -4),
240         FILTER_HCOEF(  -5,  10,  91, 185, 169,  65,   1,  -4), FILTER_HCOEF(  -5,   7,  84, 182, 174,  71,   3,  -4), FILTER_HCOEF(  -5,   5,  78, 178, 178,  78,   5,  -5),
241     }, { // x2/8 Downsampling
242         FILTER_HCOEF(  10,  52, 118, 152, 118,  52,  10,   0), FILTER_HCOEF(   9,  48, 114, 152, 122,  56,  11,   0), FILTER_HCOEF(   7,  45, 110, 151, 125,  60,  13,   1),
243         FILTER_HCOEF(   6,  41, 106, 150, 129,  64,  15,   1), FILTER_HCOEF(   5,  38, 102, 149, 132,  68,  17,   1), FILTER_HCOEF(   4,  35,  98, 148, 135,  72,  19,   1),
244         FILTER_HCOEF(   4,  31,  94, 146, 138,  77,  21,   1), FILTER_HCOEF(   3,  29,  89, 145, 140,  81,  23,   2), FILTER_HCOEF(   2,  26,  85, 143, 143,  85,  26,   2),
245     }
246 };
247 
248 static uint32_t g2dVertFilterCoef[NUM_FILTER_COEF_SETS][NUM_FILTER_PHASE][NUM_VERT_COEFFICIENTS] = {
249     {    // Upsampling
250         FILTER_VCOEF(   0, 512,   0,   0), FILTER_VCOEF( -15, 508,  20,  -1), FILTER_VCOEF( -25, 495,  45,  -3),
251         FILTER_VCOEF( -31, 473,  75,  -5), FILTER_VCOEF( -33, 443, 110,  -8), FILTER_VCOEF( -33, 408, 148, -11),
252         FILTER_VCOEF( -31, 367, 190, -14), FILTER_VCOEF( -27, 324, 234, -19), FILTER_VCOEF( -23, 279, 279, -23),
253     }, { // x7/8 Downsampling
254         FILTER_VCOEF(  32, 448,  32,   0), FILTER_VCOEF(  17, 446,  55,  -6), FILTER_VCOEF(   3, 437,  79,  -7),
255         FILTER_VCOEF(  -7, 421, 107,  -9), FILTER_VCOEF( -14, 399, 138, -11), FILTER_VCOEF( -18, 373, 170, -13),
256         FILTER_VCOEF( -20, 343, 204, -15), FILTER_VCOEF( -20, 310, 240, -18), FILTER_VCOEF( -19, 275, 275, -19),
257     }, { // x6/8 Downsampling
258         FILTER_VCOEF(  61, 390,  61,   0), FILTER_VCOEF(  46, 390,  83,  -7), FILTER_VCOEF(  31, 383, 106,  -8),
259         FILTER_VCOEF(  19, 371, 130,  -8), FILTER_VCOEF(   9, 356, 156,  -9), FILTER_VCOEF(   2, 337, 183, -10),
260         FILTER_VCOEF(  -3, 315, 210, -10), FILTER_VCOEF(  -7, 291, 238, -10), FILTER_VCOEF(  -9, 265, 265,  -9),
261     }, { // x5/8 Downsampling
262         FILTER_VCOEF(  85, 341,  86,   0), FILTER_VCOEF(  71, 341, 105,  -5), FILTER_VCOEF(  56, 336, 124,  -4),
263         FILTER_VCOEF(  43, 328, 145,  -4), FILTER_VCOEF(  32, 317, 166,  -3), FILTER_VCOEF(  23, 304, 187,  -2),
264         FILTER_VCOEF(  16, 288, 209,  -1), FILTER_VCOEF(   9, 271, 231,   1), FILTER_VCOEF(   5, 251, 251,   5),
265     }, { // x4/8 Downsampling
266         FILTER_VCOEF( 104, 304, 104,   0), FILTER_VCOEF(  89, 302, 120,   1), FILTER_VCOEF(  76, 298, 136,   2),
267         FILTER_VCOEF(  63, 293, 153,   3), FILTER_VCOEF(  52, 285, 170,   5), FILTER_VCOEF(  42, 275, 188,   7),
268         FILTER_VCOEF(  33, 264, 205,  10), FILTER_VCOEF(  26, 251, 221,  14), FILTER_VCOEF(  20, 236, 236,  20),
269     }, { // x3/8 Downsampling
270         FILTER_VCOEF( 118, 276, 118,   0), FILTER_VCOEF( 103, 273, 129,   7), FILTER_VCOEF(  90, 270, 143,   9),
271         FILTER_VCOEF(  78, 266, 157,  11), FILTER_VCOEF(  67, 260, 171,  14), FILTER_VCOEF(  57, 253, 185,  17),
272         FILTER_VCOEF(  48, 244, 199,  21), FILTER_VCOEF(  40, 234, 211,  27), FILTER_VCOEF(  33, 223, 223,  33),
273     }, { // x2/8 Downsampling
274         FILTER_VCOEF( 127, 258, 127,   0), FILTER_VCOEF( 111, 252, 135,  14), FILTER_VCOEF( 100, 250, 147,  15),
275         FILTER_VCOEF(  88, 247, 159,  18), FILTER_VCOEF(  78, 242, 171,  21), FILTER_VCOEF(  68, 237, 182,  25),
276         FILTER_VCOEF(  59, 230, 193,  30), FILTER_VCOEF(  50, 222, 204,  36), FILTER_VCOEF(  43, 213, 213,  43),
277     }
278 };
279 
findFilterCoefficientsIndex(uint32_t factor)280 static unsigned int findFilterCoefficientsIndex(uint32_t factor)
281 {
282     static uint32_t choicetable[NUM_FILTER_COEF_SETS] = {
283         G2D_SCALE_FACTOR(8, 8), G2D_SCALE_FACTOR(8, 7), G2D_SCALE_FACTOR(8, 6), G2D_SCALE_FACTOR(8, 5),
284         G2D_SCALE_FACTOR(8, 4), G2D_SCALE_FACTOR(8, 3), G2D_SCALE_FACTOR(8, 2),
285     };
286 
287     for (unsigned int i = 0; i < NUM_FILTER_COEF_SETS; i++)
288         if (factor <= choicetable[i])
289             return i;
290     // if i == NUM_FILTER_COEF_SETS, the downsampling factor is larger than 4.0 which is not supported by the filter.
291     return NUM_FILTER_COEF_SETS - 1;
292 }
293 
294 template<typename CoefT>
__writeFilterCoefficients(CoefT & coef_set,unsigned int index,uint32_t base,g2d_reg regs[])295 static unsigned int __writeFilterCoefficients(CoefT &coef_set, unsigned int index, uint32_t base, g2d_reg regs[])
296 {
297     // The default value of filter coefficients are values of 8:8/zoom-in
298     // So, do not update redundantly.
299     if (index == 0)
300         return 0;
301 
302     unsigned int cnt = 0;
303 
304     for (auto &coef_table: coef_set[index]) {
305         uint32_t coef_base = base;
306         // register offsets of filter coeffcients are ordered by phase number then tab index
307         // while values are ordered by tab index then phase number in the above coefficients array.
308         // So register offset is increased by the number of tabs instead of 1.
309         // The coefficients array is specified in the order of tab index due to readability
310         // because the coefficient values are also specified in the same order in UM.
311         for (auto coef: coef_table) {
312             regs[cnt].offset = coef_base;
313             regs[cnt].value = coef;
314             coef_base += (sizeof(coef_set[index]) / sizeof(coef_table)) * sizeof(coef_table[0]);
315             cnt++;
316         }
317         base += sizeof(uint32_t);
318     }
319 
320     return cnt;
321 }
322 
getChromaScaleFactor(uint32_t colormode,unsigned int * hfactor,unsigned int * vfactor)323 void getChromaScaleFactor(uint32_t colormode, unsigned int *hfactor, unsigned int *vfactor)
324 {
325     switch (colormode & G2D_DATAFMT_MASK) {
326         case G2D_DATAFMT_YUV420SP:
327         case G2D_DATAFMT_YUV420P:
328             *hfactor /= 2;
329             [[fallthrough]];
330         case G2D_DATAFMT_YUV422SP:
331         case G2D_DATAFMT_YUV422I:
332             *vfactor /= 2;
333             break;
334         default:
335             break;
336     }
337 }
338 
writeFilterCoefficients(uint32_t hfactor,uint32_t vfactor,uint32_t colormode,unsigned layer_index,g2d_reg regs[])339 static unsigned int writeFilterCoefficients(uint32_t hfactor, uint32_t vfactor, uint32_t colormode,
340                                             unsigned layer_index, g2d_reg regs[])
341 {
342     unsigned int hindex = findFilterCoefficientsIndex(hfactor);
343     unsigned int vindex = findFilterCoefficientsIndex(vfactor);
344     // Filter coefficients of 1:1 and upsampling are configured to the filter by default (reset value)
345     if ((hindex == 0) && (vindex == 0))
346         return 0;
347 
348     unsigned int base = G2D_FILTER_COEF_REG(layer_index);
349     unsigned int cnt = 0;
350     // Y Coefficients
351     cnt += __writeFilterCoefficients(g2dVertFilterCoef, vindex, base, regs);
352     cnt += __writeFilterCoefficients(g2dHoriFilterCoef, hindex, base + sizeof(g2dVertFilterCoef[0]), regs + cnt);
353     if (IS_YUV(colormode)) {
354         // C Coefficients
355         getChromaScaleFactor(colormode, &hfactor, &vfactor);
356 
357         hindex = findFilterCoefficientsIndex(hfactor);
358         vindex = findFilterCoefficientsIndex(vfactor);
359         base += G2D_FILTER_C_OFFSET;
360         cnt += __writeFilterCoefficients(g2dVertFilterCoef, vindex, base, regs + cnt);
361         cnt += __writeFilterCoefficients(g2dHoriFilterCoef, hindex, base + sizeof(g2dVertFilterCoef[0]), regs + cnt);
362     }
363 
364     return cnt;
365 }
366 
getFilterCoefficientCount(uint32_t * src_cmds[],unsigned int layer_count)367 static unsigned int getFilterCoefficientCount(uint32_t *src_cmds[], unsigned int layer_count)
368 {
369     unsigned int count = 0;
370 
371 
372     for (unsigned int i = 0; i < layer_count; i++) {
373         unsigned int layer_coef_cnt = 0;
374         unsigned int hfactor = src_cmds[i][G2DSFR_SRC_XSCALE];
375         unsigned int vfactor = src_cmds[i][G2DSFR_SRC_YSCALE];
376 
377         if (hfactor > G2D_SCALE_FACTOR(8, 8))
378             layer_coef_cnt += NUM_HORI_COEF_REGS;
379         if (vfactor > G2D_SCALE_FACTOR(8, 8))
380             layer_coef_cnt += NUM_VERT_COEF_REGS;
381         if (IS_YUV(src_cmds[i][G2DSFR_IMG_COLORMODE])) {
382             getChromaScaleFactor(src_cmds[i][G2DSFR_IMG_COLORMODE], &hfactor, &vfactor);
383             if (hfactor > G2D_SCALE_FACTOR(8, 8))
384                 layer_coef_cnt += NUM_HORI_COEF_REGS;
385             if (vfactor > G2D_SCALE_FACTOR(8, 8))
386                 layer_coef_cnt += NUM_VERT_COEF_REGS;
387         }
388 
389         count += layer_coef_cnt;
390     }
391 
392     return count;
393 }
394 
show_g2d_layer(const char * title,int idx,const g2d_layer & layer)395 static void show_g2d_layer(const char *title, int idx, const g2d_layer &layer)
396 {
397     ALOGD("%s%d: flags %#x, fence %d, buffer_type %d, num_buffers %d", title, idx,
398           layer.flags, layer.fence, layer.buffer_type, layer.num_buffers);
399     for (unsigned int i = 0; i < layer.num_buffers; i++) {
400         ALOGD("         buf[%d] ptr %p, fd %d, offset %u, length %u",
401               i, layer.buffer[i].userptr,
402               layer.buffer[i].dmabuf.fd, layer.buffer[i].dmabuf.offset,
403               layer.buffer[i].length);
404     }
405 }
406 
show_g2d_commands(const g2d_commands & cmds)407 static void show_g2d_commands(const g2d_commands &cmds)
408 {
409     for (unsigned int i = 0; i < G2DSFR_DST_FIELD_COUNT; i++)
410         ALOGD("DST[%02d]: %#010x", i, cmds.target[i]);
411 
412     for (unsigned int idx = 0; idx < G2D_MAX_IMAGES; idx++) {
413         if (cmds.source[idx]) {
414             for (unsigned int i = 0; i < G2DSFR_SRC_FIELD_COUNT; i++)
415                 ALOGD("SRC[%02d][%02d]: %#010x", idx, i, cmds.source[idx][i]);
416         }
417     }
418 
419     if (cmds.extra) {
420         for (unsigned int i = 0; i < cmds.num_extra_regs; i++)
421             ALOGD("EXTRA: offset %#010x, value %#010x",
422                   cmds.extra[i].offset, cmds.extra[i].value);
423     }
424 }
425 
show_g2d_task(const g2d_task & task)426 static void show_g2d_task(const g2d_task &task)
427 {
428     ALOGD("Showing the content of G2D task descriptor ver %#010x", task.version);
429     ALOGD("source count %d, flags %#x, priority %d, num_release_fences %d",
430           task.num_source, task.flags, task.priority, task.num_release_fences);
431     show_g2d_layer("Target", 0, task.target);
432     for (unsigned int i = 0; i < task.num_source; i++)
433         show_g2d_layer("Source", i, task.source[i]);
434     show_g2d_commands(task.commands);
435 }
436 
437 #ifdef LIBACRYL_DEBUG
debug_show_g2d_task(const g2d_task & task)438 static void debug_show_g2d_task(const g2d_task &task)
439 {
440     ALOGD("Showing the content of G2D task descriptor ver %#010x", task.version);
441     ALOGD("source count %d, flags %#x, priority %d, num_release_fences %d",
442           task.num_source, task.flags, task.priority, task.num_release_fences);
443     show_g2d_layer("Target", 0, task.target);
444     for (unsigned int i = 0; i < task.num_source; i++)
445         show_g2d_layer("Source", i, task.source[i]);
446     show_g2d_commands(task.commands);
447 }
448 #else
449 #define debug_show_g2d_task(task) do { } while (0)
450 #endif
451 
452 struct g2d_fmt {
453     uint32_t halfmt;
454     uint32_t g2dfmt;
455     uint32_t num_bufs;
456     uint32_t rgb_bpp;
457 };
458 
459 static g2d_fmt __halfmt_to_g2dfmt_legacy[] = {
460 //  {halfmt,                                      g2dfmt,  num_buffers, rgbbpp}
461     {HAL_PIXEL_FORMAT_RGBA_8888,                  G2D_FMT_ABGR8888,  1, 4},
462     {HAL_PIXEL_FORMAT_BGRA_8888,                  G2D_FMT_ARGB8888,  1, 4},
463     {HAL_PIXEL_FORMAT_RGBX_8888,                  G2D_FMT_XBGR8888,  1, 4},
464     {HAL_PIXEL_FORMAT_RGBA_1010102,               G2D_FMT_ABGR2101010, 1, 4},
465     {HAL_PIXEL_FORMAT_RGB_888,                    G2D_FMT_RGB888,    1, 3},
466     {HAL_PIXEL_FORMAT_RGB_565,                    G2D_FMT_RGB565,    1, 2},
467 //  {HAL_PIXEL_FORMAT_YV12,                       G2D_FMT_YV12,      1, 0},
468 //  {HAL_PIXEL_FORMAT_EXYNOS_YV12_M,              G2D_FMT_YV12,      3, 0},
469     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P,         G2D_FMT_YV12,      1, 0},
470     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_PN,        G2D_FMT_YV12,      1, 0},
471     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P_M,       G2D_FMT_YV12,      3, 0},
472     {HAL_PIXEL_FORMAT_YCrCb_420_SP,               G2D_FMT_NV21,      1, 0},
473     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M,      G2D_FMT_NV21,      2, 0},
474     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_FULL, G2D_FMT_NV21,      2, 0},
475     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP,        G2D_FMT_NV12,      1, 0},
476     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M,      G2D_FMT_NV12,      2, 0},
477     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,       G2D_FMT_NV12,      1, 0},
478     {HAL_PIXEL_FORMAT_YCBCR_P010,                 G2D_FMT_NV12_P010_LGCY, 1, 0},
479     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_P010_M,        G2D_FMT_NV12_P010_LGCY, 2, 0},
480     {HAL_PIXEL_FORMAT_YCbCr_422_I,                G2D_FMT_YUYV,      1, 0},
481     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_422_I,         G2D_FMT_YVYU,      1, 0},
482     {HAL_PIXEL_FORMAT_YCbCr_422_SP,               G2D_FMT_NV16,      1, 0},
483     // TODO: add p010
484 };
485 
486 static g2d_fmt __halfmt_to_g2dfmt[] = {
487 //  {halfmt,                                      g2dfmt,  num_buffers, rgbbpp}
488     {HAL_PIXEL_FORMAT_RGBA_8888,                  G2D_FMT_ABGR8888,  1, 4},
489     {HAL_PIXEL_FORMAT_BGRA_8888,                  G2D_FMT_ARGB8888,  1, 4},
490     {HAL_PIXEL_FORMAT_RGBX_8888,                  G2D_FMT_XBGR8888,  1, 4},
491     {HAL_PIXEL_FORMAT_RGBA_1010102,               G2D_FMT_ABGR2101010, 1, 4},
492     {HAL_PIXEL_FORMAT_RGB_888,                    G2D_FMT_RGB888,    1, 3},
493     {HAL_PIXEL_FORMAT_RGB_565,                    G2D_FMT_RGB565,    1, 2},
494     {HAL_PIXEL_FORMAT_YV12,                       G2D_FMT_YV12,      1, 0},
495     {HAL_PIXEL_FORMAT_EXYNOS_YV12_M,              G2D_FMT_YV12,      3, 0},
496     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P,         G2D_FMT_YUV420P,   1, 0},
497     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_PN,        G2D_FMT_YUV420P,   1, 0},
498     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P_M,       G2D_FMT_YUV420P,   3, 0},
499     {HAL_PIXEL_FORMAT_YCrCb_420_SP,               G2D_FMT_NV21,      1, 0},
500     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M,      G2D_FMT_NV21,      2, 0},
501     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_FULL, G2D_FMT_NV21,      2, 0},
502     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP,        G2D_FMT_NV12,      1, 0},
503     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M,      G2D_FMT_NV12,      2, 0},
504     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,       G2D_FMT_NV12,      1, 0},
505     {HAL_PIXEL_FORMAT_GOOGLE_NV12_SP,             G2D_FMT_NV12,      1, 0},
506     {MALI_GRALLOC_FORMAT_INTERNAL_YUV420_8BIT_I,  G2D_FMT_NV12,      1, 0},
507     {HAL_PIXEL_FORMAT_YCBCR_P010,                 G2D_FMT_NV12_P010, 1, 0},
508     {HAL_PIXEL_FORMAT_GOOGLE_NV12_SP_10B,         G2D_FMT_NV12_P010, 1, 0},
509     {MALI_GRALLOC_FORMAT_INTERNAL_YUV420_10BIT_I, G2D_FMT_NV12_P010, 1, 0},
510     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_P010_M,        G2D_FMT_NV12_P010, 2, 0},
511     {HAL_PIXEL_FORMAT_YCbCr_422_I,                G2D_FMT_YUYV,      1, 0},
512     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_422_I,         G2D_FMT_YVYU,      1, 0},
513     {HAL_PIXEL_FORMAT_YCbCr_422_SP,               G2D_FMT_NV16,      1, 0},
514     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC,     G2D_FMT_NV12_SBWC, 2, 0},
515     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC,      G2D_FMT_NV12_SBWC, 1, 0},
516     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC, G2D_FMT_NV12_SBWC_10B, 2, 0},
517     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC,  G2D_FMT_NV12_SBWC_10B, 1, 0},
518     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_SBWC,     G2D_FMT_NV21_SBWC, 2, 0},
519     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_10B_SBWC, G2D_FMT_NV21_SBWC_10B, 2, 0},
520     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L50, G2D_FMT_NV12_SBWC, 2, 0},
521     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L40, G2D_FMT_NV12_SBWC_10B, 2, 0},
522     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L80, G2D_FMT_NV12_SBWC_10B, 2, 0},
523     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L50, G2D_FMT_NV12_SBWC, 2, 0},
524     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC_L50, G2D_FMT_NV12_SBWC, 1, 0},
525     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L75, G2D_FMT_NV12_SBWC, 2,0},
526     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC_L75, G2D_FMT_NV12_SBWC, 1,0},
527     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L40, G2D_FMT_NV12_SBWC_10B, 2, 0},
528     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L40, G2D_FMT_NV12_SBWC_10B, 1, 0},
529     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L60, G2D_FMT_NV12_SBWC_10B, 2,0},
530     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L60, G2D_FMT_NV12_SBWC_10B, 1,0},
531     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L80, G2D_FMT_NV12_SBWC_10B, 2,0},
532     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L80, G2D_FMT_NV12_SBWC_10B, 1,0},
533 };
534 
halfmt_to_g2dfmt(struct g2d_fmt * tbl,size_t tbl_len,uint32_t halfmt)535 static g2d_fmt *halfmt_to_g2dfmt(struct g2d_fmt *tbl, size_t tbl_len, uint32_t halfmt)
536 {
537     for (size_t i = 0 ; i < tbl_len; i++) {
538         if (tbl[i].halfmt == halfmt)
539             return &tbl[i];
540     }
541 
542     ALOGE("Unable to find the proper G2D format for HAL format %#x", halfmt);
543 
544     return NULL;
545 }
546 
AcrylicCompositorG2D(const HW2DCapability & capability,bool newcolormode)547 AcrylicCompositorG2D::AcrylicCompositorG2D(const HW2DCapability &capability, bool newcolormode)
548     : Acrylic(capability), mDev((capability.maxLayerCount() > 2) ? "/dev/g2d" : "/dev/fimg2d"),
549       mMaxSourceCount(0), mPriority(-1)
550 {
551     memset(&mTask, 0, sizeof(mTask));
552 
553     mVersion = 0;
554     if (mDev.ioctl(G2D_IOC_VERSION, &mVersion) < 0)
555         ALOGERR("Failed to get G2D command version");
556     ALOGI("G2D API Version %d", mVersion);
557 
558     halfmt_to_g2dfmt_tbl = newcolormode ? __halfmt_to_g2dfmt : __halfmt_to_g2dfmt_legacy;
559     len_halfmt_to_g2dfmt_tbl = newcolormode ? ARRSIZE(__halfmt_to_g2dfmt) : ARRSIZE(__halfmt_to_g2dfmt_legacy);
560 
561     mUsePolyPhaseFilter = getCapabilities().supportedMinDecimation() == hw2d_coord_t{4, 4};
562 
563     ALOGD_TEST("Created a new Acrylic for G2D on %p", this);
564 }
565 
~AcrylicCompositorG2D()566 AcrylicCompositorG2D::~AcrylicCompositorG2D()
567 {
568     delete [] mTask.source;
569     delete [] mTask.commands.target;
570     for (unsigned int i = 0; i < mMaxSourceCount; i++)
571         delete [] mTask.commands.source[i];
572 
573     ALOGD_TEST("Deleting Acrylic for G2D on %p", this);
574 }
575 
updateFilterCoefficients(unsigned int layercount,g2d_reg regs[])576 unsigned int AcrylicCompositorG2D::updateFilterCoefficients(unsigned int layercount, g2d_reg regs[])
577 {
578     if (!mUsePolyPhaseFilter)
579         return 0;
580 
581     unsigned int cnt = 0;
582 
583     for (unsigned int i = 0; i < layercount; i++)
584         cnt += writeFilterCoefficients(mTask.commands.source[i][G2DSFR_SRC_XSCALE],
585                                        mTask.commands.source[i][G2DSFR_SRC_YSCALE],
586                                        mTask.commands.source[i][G2DSFR_IMG_COLORMODE],
587                                        i, regs + cnt);
588 
589     return cnt;
590 }
591 
592 #define SBWC_BLOCK_WIDTH 32
593 #define SBWC_BLOCK_HEIGHT 4
594 #define SBWC_BLOCK_SIZE(bit) (SBWC_BLOCK_WIDTH * SBWC_BLOCK_HEIGHT * (bit) / 8)
595 
596 #define SBWC_HEADER_ALIGN 16
597 #define SBWC_PAYLOAD_ALIGN 32
598 
599 #define SBWC_HEADER_STRIDE(w) \
600 	ALIGN(((w) / SBWC_BLOCK_WIDTH / 2), SBWC_HEADER_ALIGN)
601 #define SBWC_PAYLOAD_STRIDE(w, dep)\
602 	ALIGN(((w) / SBWC_BLOCK_WIDTH) * SBWC_BLOCK_SIZE(dep), \
603 	      SBWC_PAYLOAD_ALIGN)
604 
605 #define SBWC_LOSSY_PAYLOAD_STRIDE(w, block_byte) \
606 	ALIGN(((w) / SBWC_BLOCK_WIDTH) * (block_byte), \
607 	      SBWC_PAYLOAD_ALIGN)
608 
609 static uint32_t mfc_stride_formats[] = {
610     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,
611     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC,
612     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC,
613     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC,
614     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC,
615     HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_SBWC,
616     HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_10B_SBWC,
617 };
618 
619 struct lossy_formats {
620         unsigned int halfmt;
621         unsigned int blocksize;
622 };
623 
624 static lossy_formats sbwc_lossy_formats[] {
625    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L50,            64},
626    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L40,        64},
627    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC_L50,             64},
628    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L40,          64},
629    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L75,             96},
630    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L60,         96},
631    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC_L75,              96},
632    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L60,          96},
633    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L80,         128},
634    {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC_L80,          128},
635 };
636 
637 
prepareImage(AcrylicCanvas & layer,struct g2d_layer & image,uint32_t cmd[],int index)638 bool AcrylicCompositorG2D::prepareImage(AcrylicCanvas &layer, struct g2d_layer &image, uint32_t cmd[], int index)
639 {
640     image.flags = 0;
641 
642     if (layer.getFence() >= 0) {
643         image.flags |= G2D_LAYERFLAG_ACQUIRE_FENCE;
644         image.fence = layer.getFence();
645     }
646 
647     if (layer.isProtected())
648         image.flags |= G2D_LAYERFLAG_SECURE;
649 
650     g2d_fmt *g2dfmt = halfmt_to_g2dfmt(halfmt_to_g2dfmt_tbl, len_halfmt_to_g2dfmt_tbl, layer.getFormat());
651     if (!g2dfmt)
652         return false;
653 
654     image.flags &= ~G2D_LAYERFLAG_MFC_STRIDE;
655     for (size_t i = 0; i < ARRSIZE(mfc_stride_formats); i++) {
656         if (layer.getFormat() == mfc_stride_formats[i]) {
657             image.flags |= G2D_LAYERFLAG_MFC_STRIDE;
658             break;
659         }
660     }
661 
662     if (layer.getBufferType() == AcrylicCanvas::MT_EMPTY) {
663         image.buffer_type = G2D_BUFTYPE_EMPTY;
664     } else {
665         if (layer.getBufferCount() < g2dfmt->num_bufs) {
666             ALOGE("HAL Format %#x requires %d buffers but %d buffers are given",
667                     layer.getFormat(), g2dfmt->num_bufs, layer.getBufferCount());
668             return false;
669         }
670 
671         if (layer.getBufferType() == AcrylicCanvas::MT_DMABUF) {
672             image.buffer_type = G2D_BUFTYPE_DMABUF;
673             for (unsigned int i = 0; i < g2dfmt->num_bufs; i++) {
674                 image.buffer[i].dmabuf.fd = layer.getDmabuf(i);
675                 image.buffer[i].dmabuf.offset = layer.getOffset(i);
676                 image.buffer[i].length = layer.getBufferLength(i);
677             }
678         } else {
679             LOGASSERT(layer.getBufferType() == AcrylicCanvas::MT_USERPTR,
680                       "Unknown buffer type %d", layer.getBufferType());
681             image.buffer_type = G2D_BUFTYPE_USERPTR;
682             for (unsigned int i = 0; i < g2dfmt->num_bufs; i++) {
683                 image.buffer[i].userptr = layer.getUserptr(i);
684                 image.buffer[i].length = layer.getBufferLength(i);
685             }
686         }
687     }
688 
689     image.num_buffers = g2dfmt->num_bufs;
690 
691     hw2d_coord_t xy = layer.getImageDimension();
692 
693     cmd[G2DSFR_IMG_COLORMODE] = g2dfmt->g2dfmt;
694     if (layer.isUOrder())
695         cmd[G2DSFR_IMG_COLORMODE] |= G2D_DATAFORMAT_UORDER;
696 
697     if (layer.isCompressed()) {
698         // AFBC forces RGB swizzling order to BGR for RGB565
699         if (g2dfmt->g2dfmt == G2D_FMT_RGB565)
700             cmd[G2DSFR_IMG_COLORMODE] = G2D_FMT_BGR565;
701         cmd[G2DSFR_IMG_COLORMODE] |= G2D_DATAFORMAT_AFBC;
702         cmd[G2DSFR_IMG_STRIDE] = 0;
703     } else if (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC) {
704         cmd[G2DSFR_IMG_STRIDE] = 0;
705     } else {
706         cmd[G2DSFR_IMG_STRIDE] = g2dfmt->rgb_bpp * xy.hori;
707     }
708 
709     unsigned int payload = 0, header = 0, lossyByteNum = 0;
710 
711     if (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC) {
712         unsigned int blocksize;
713         unsigned int isLossy = 0;
714         unsigned int format = layer.getFormat();
715 
716         for (unsigned int i = 0; i < ARRSIZE(sbwc_lossy_formats); i++) {
717             if (format == sbwc_lossy_formats[i].halfmt) {
718                 isLossy = 1;
719                 blocksize = sbwc_lossy_formats[i].blocksize;
720                 break;
721             }
722         }
723 
724         if (isLossy) {
725             lossyByteNum = (blocksize >> 1) | isLossy;
726             payload = SBWC_LOSSY_PAYLOAD_STRIDE(xy.hori, blocksize);
727         } else {
728             payload = SBWC_PAYLOAD_STRIDE(xy.hori, (g2dfmt->g2dfmt & G2D_FMT_YCBCR_10BIT) ? 10 : 8);
729             header = SBWC_HEADER_STRIDE(xy.hori);
730         }
731     }
732 
733     if (index < 0) {
734         cmd[G2DSFR_DST_Y_HEADER_STRIDE] = header;
735         cmd[G2DSFR_DST_C_HEADER_STRIDE] = header;
736         cmd[G2DSFR_DST_Y_PAYLOAD_STRIDE] = payload;
737         cmd[G2DSFR_DST_C_PAYLOAD_STRIDE] = payload;
738         cmd[G2DSFR_DST_SBWCINFO] = lossyByteNum;
739     } else {
740         cmd[G2DSFR_SRC_Y_HEADER_STRIDE] = header;
741         cmd[G2DSFR_SRC_C_HEADER_STRIDE] = header;
742         cmd[G2DSFR_SRC_Y_PAYLOAD_STRIDE] = payload;
743         cmd[G2DSFR_SRC_C_PAYLOAD_STRIDE] = payload;
744         cmd[G2DSFR_SRC_SBWCINFO] = lossyByteNum;
745     }
746 
747     cmd[G2DSFR_IMG_LEFT]   = 0;
748     cmd[G2DSFR_IMG_TOP]    = 0;
749     cmd[G2DSFR_IMG_RIGHT]  = xy.hori;
750     cmd[G2DSFR_IMG_BOTTOM] = xy.vert;
751     cmd[G2DSFR_IMG_WIDTH]  = xy.hori;
752     cmd[G2DSFR_IMG_HEIGHT] = xy.vert;
753 
754     return true;
755 }
756 
setSolidLayer(struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t xy)757 static void setSolidLayer(struct g2d_layer &image, uint32_t cmd[], hw2d_coord_t xy)
758 {
759     image.flags = G2D_LAYERFLAG_COLORFILL;
760     image.buffer_type = G2D_BUFTYPE_EMPTY;
761     image.num_buffers = 0;
762 
763     cmd[G2DSFR_IMG_COLORMODE] = G2D_FMT_ARGB8888;
764     cmd[G2DSFR_IMG_STRIDE] = 4 * xy.hori;
765 
766     cmd[G2DSFR_IMG_WIDTH]  = xy.hori;
767     cmd[G2DSFR_IMG_HEIGHT] = xy.vert;
768 
769     cmd[G2DSFR_SRC_SELECT] = G2D_LAYERSEL_COLORFILL;
770     cmd[G2DSFR_SRC_COMMAND] = G2D_LAYERCMD_VALID;
771 
772     cmd[G2DSFR_SRC_ROTATE] = 0;
773     cmd[G2DSFR_SRC_SCALECONTROL] = 0;
774     cmd[G2DSFR_SRC_XSCALE] = G2D_SCALE_FACTOR(1, 1);
775     cmd[G2DSFR_SRC_YSCALE] = G2D_SCALE_FACTOR(1, 1);
776     cmd[G2DSFR_SRC_XPHASE] = 0;
777     cmd[G2DSFR_SRC_YPHASE] = 0;
778     cmd[G2DSFR_SRC_YCBCRMODE] = 0;
779     cmd[G2DSFR_SRC_HDRMODE] = 0;
780     cmd[G2DSFR_SRC_Y_HEADER_STRIDE] = 0;
781     cmd[G2DSFR_SRC_C_HEADER_STRIDE] = 0;
782     cmd[G2DSFR_SRC_Y_PAYLOAD_STRIDE] = 0;
783     cmd[G2DSFR_SRC_C_PAYLOAD_STRIDE] = 0;
784     cmd[G2DSFR_SRC_SBWCINFO] = 0;
785 }
786 
prepareSolidLayer(AcrylicCanvas & canvas,struct g2d_layer & image,uint32_t cmd[])787 bool AcrylicCompositorG2D::prepareSolidLayer(AcrylicCanvas &canvas, struct g2d_layer &image, uint32_t cmd[])
788 {
789     hw2d_coord_t xy = canvas.getImageDimension();
790 
791     setSolidLayer(image, cmd, xy);
792 
793     uint16_t a, r, g, b;
794     getBackgroundColor(&r, &g, &b, &a);
795 
796     cmd[G2DSFR_SRC_COLOR]  = (a & 0xFF00) << 16;
797     cmd[G2DSFR_SRC_COLOR] |= (r & 0xFF00) << 8;
798     cmd[G2DSFR_SRC_COLOR] |= (g & 0xFF00) << 0;
799     cmd[G2DSFR_SRC_COLOR] |= (b & 0xFF00) >> 8;
800 
801     cmd[G2DSFR_IMG_LEFT]   = 0;
802     cmd[G2DSFR_IMG_TOP]    = 0;
803     cmd[G2DSFR_IMG_RIGHT]  = xy.hori;
804     cmd[G2DSFR_IMG_BOTTOM] = xy.vert;
805 
806     cmd[G2DSFR_SRC_DSTLEFT]   = 0;
807     cmd[G2DSFR_SRC_DSTTOP]    = 0;
808     cmd[G2DSFR_SRC_DSTRIGHT]  = xy.hori;
809     cmd[G2DSFR_SRC_DSTBOTTOM] = xy.vert;
810 
811     cmd[G2DSFR_SRC_ALPHA] = 0;
812     cmd[G2DSFR_SRC_BLEND] = 0;
813 
814     return true;
815 }
816 
prepareSolidLayer(AcrylicLayer & layer,struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t target_size,unsigned int index)817 bool AcrylicCompositorG2D::prepareSolidLayer(AcrylicLayer &layer, struct g2d_layer &image, uint32_t cmd[], hw2d_coord_t target_size, unsigned int index)
818 {
819     hw2d_coord_t xy = layer.getImageDimension();
820 
821     setSolidLayer(image, cmd, xy);
822 
823     cmd[G2DSFR_SRC_COLOR]  = layer.getSolidColor();
824 
825     hw2d_rect_t crop = layer.getImageRect();
826     cmd[G2DSFR_IMG_LEFT]   = crop.pos.hori;
827     cmd[G2DSFR_IMG_TOP]    = crop.pos.vert;
828     cmd[G2DSFR_IMG_RIGHT]  = crop.size.hori + crop.pos.hori;
829     cmd[G2DSFR_IMG_BOTTOM] = crop.size.vert + crop.pos.vert;
830 
831     hw2d_rect_t window = layer.getTargetRect();
832     if (area_is_zero(window))
833         window.size = target_size;
834     cmd[G2DSFR_SRC_DSTLEFT]   = window.pos.hori;
835     cmd[G2DSFR_SRC_DSTTOP]    = window.pos.vert;
836     cmd[G2DSFR_SRC_DSTRIGHT]  = window.size.hori + window.pos.hori;
837     cmd[G2DSFR_SRC_DSTBOTTOM] = window.size.vert + window.pos.vert;
838 
839     uint8_t alpha = layer.getPlaneAlpha();
840     cmd[G2DSFR_SRC_ALPHA] = (alpha << 24) | (alpha << 16) | (alpha << 8) | alpha;
841     if ((layer.getCompositingMode() == HWC_BLENDING_PREMULT) ||
842             (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED)) {
843         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCOVER;
844     } else if ((layer.getCompositingMode() == HWC_BLENDING_COVERAGE) ||
845                (layer.getCompositingMode() == HWC2_BLEND_MODE_COVERAGE)) {
846         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_NONE;
847     } else {
848         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCCOPY;
849     }
850 
851     /* bottom layer always is opaque */
852     if (index == 0) {
853        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_OPAQUE;
854        if (alpha < 255)
855            cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_PREMULT_GLOBALALPHA;
856     } else {
857        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_ALPHABLEND;
858     }
859 
860     return true;
861 }
862 
prepareSource(AcrylicLayer & layer,struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t target_size,unsigned int index,unsigned int image_index)863 bool AcrylicCompositorG2D::prepareSource(AcrylicLayer &layer, struct g2d_layer &image, uint32_t cmd[],
864                                              hw2d_coord_t target_size, unsigned int index, unsigned int image_index)
865 {
866     if (layer.isSolidColor()) {
867         prepareSolidLayer(layer, image, cmd, target_size, image_index);
868 
869         return true;
870     }
871 
872     if (!prepareImage(layer, image, cmd, index))
873         return false;
874 
875     cmd[G2DSFR_SRC_SELECT] = 0;
876 
877     hw2d_rect_t crop = layer.getImageRect();
878     cmd[G2DSFR_IMG_LEFT]   = crop.pos.hori;
879     cmd[G2DSFR_IMG_TOP]    = crop.pos.vert;
880     cmd[G2DSFR_IMG_RIGHT]  = crop.size.hori + crop.pos.hori;
881     cmd[G2DSFR_IMG_BOTTOM] = crop.size.vert + crop.pos.vert;
882 
883     hw2d_rect_t window = layer.getTargetRect();
884     if (area_is_zero(window))
885         window.size = target_size;
886     cmd[G2DSFR_SRC_DSTLEFT]   = window.pos.hori;
887     cmd[G2DSFR_SRC_DSTTOP]    = window.pos.vert;
888     cmd[G2DSFR_SRC_DSTRIGHT]  = window.size.hori + window.pos.hori;
889     cmd[G2DSFR_SRC_DSTBOTTOM] = window.size.vert + window.pos.vert;
890 
891     if (layer.isCompressed()) {
892         cmd[G2DSFR_IMG_WIDTH]--;
893         cmd[G2DSFR_IMG_HEIGHT]--;
894     }
895 
896     cmd[G2DSFR_SRC_ROTATE] = 0;
897     // HAL FLIP value: FLIP_H=0x01, FLIP_V=0x02
898     // G2D FLIP value: FLIP_Y=0x05, FLIP_X=0x04
899     unsigned int flip = layer.getTransform() & (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V);
900     if (!!(layer.getTransform() & HAL_TRANSFORM_ROT_90)) {
901         window.size.swap();
902 
903         cmd[G2DSFR_SRC_ROTATE] |= G2D_ROTATEDIR_ROT90CCW;
904         if (!flip || (flip == (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V)))
905             flip = ~flip & (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V);
906     }
907 
908     cmd[G2DSFR_SRC_ROTATE] |= flip << G2D_ROTATEDIR_FLIP_SHIFT;
909 
910     cmd[G2DSFR_SRC_XSCALE] = G2D_SCALE_FACTOR(crop.size.hori, window.size.hori);
911     cmd[G2DSFR_SRC_YSCALE] = G2D_SCALE_FACTOR(crop.size.vert, window.size.vert);
912     // Configure interpolation only if it is required.
913     // Otherwise, G2D needs more bandwidth because it interpolates pixels
914     // even though it is not required.
915     if ((cmd[G2DSFR_SRC_XSCALE] | cmd[G2DSFR_SRC_YSCALE]) == G2D_SCALE_FACTOR(1, 1))
916         cmd[G2DSFR_SRC_SCALECONTROL] = 0;
917     else if (mUsePolyPhaseFilter)
918         cmd[G2DSFR_SRC_SCALECONTROL] = (index << G2D_SCALECONTROL_FILTERCOEF_SHIFT) | G2D_SCALECONTROL_POLYPHASE;
919     else
920         cmd[G2DSFR_SRC_SCALECONTROL] = G2D_SCALECONTROL_BILINEAR;
921 
922     // TODO: Configure initial phases according to the scale factors
923      cmd[G2DSFR_SRC_XPHASE] = 0;
924      cmd[G2DSFR_SRC_YPHASE] = 0;
925 
926     uint8_t alpha = layer.getPlaneAlpha();
927     cmd[G2DSFR_SRC_ALPHA] = (alpha << 24) | (alpha << 16) | (alpha << 8) | alpha;
928     if ((layer.getCompositingMode() == HWC_BLENDING_PREMULT) ||
929             (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED)) {
930         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCOVER;
931     } else if ((layer.getCompositingMode() == HWC_BLENDING_COVERAGE) ||
932                (layer.getCompositingMode() == HWC2_BLEND_MODE_COVERAGE)) {
933         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_NONE;
934     } else {
935         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCCOPY;
936 
937         // HWC_BLEND_NONE is used not to appear its lower layer to target layer.
938         // But, when G2D output is reused by DPU, lower layer could appear to target layer.
939         // To prevent this, when blend mode is HWC_BLEND_NONE, make alpha channel max.
940         // Example case is as follow.
941         // If G2D composites several layers and topmost layer is HWC_BLEND_NONE
942         // and has alpha lower than max, that alpha value remains in target buffer.
943         // And if this result layer is recomposited with lower layer by DPU
944         // lower layer color appears to final result layer.
945         if ((cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ABGR8888) ||
946             (cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ARGB8888) ||
947             (cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ABGR2101010)) {
948             cmd[G2DSFR_IMG_COLORMODE] &= ~G2D_SWZ_ALPHA_MASK;
949             cmd[G2DSFR_IMG_COLORMODE] |= G2D_SWZ_ALPHA_ONE;
950         }
951     }
952 
953     cmd[G2DSFR_SRC_COMMAND] = G2D_LAYERCMD_VALID;
954 
955     /* bottom layer always is opaque */
956     if (image_index == 0) {
957        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_OPAQUE;
958        if (alpha < 255)
959            cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_PREMULT_GLOBALALPHA;
960     } else {
961        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_ALPHABLEND;
962     }
963 
964     cmd[G2DSFR_SRC_YCBCRMODE] = 0;
965     cmd[G2DSFR_SRC_HDRMODE] = 0;
966 
967     return true;
968 }
969 
reallocLayer(unsigned int layercount)970 bool AcrylicCompositorG2D::reallocLayer(unsigned int layercount)
971 {
972     if (mMaxSourceCount >= layercount)
973         return true;
974 
975     if (!mTask.commands.target) {
976         mTask.commands.target = new uint32_t[G2DSFR_DST_FIELD_COUNT];
977         if (!mTask.commands.target) {
978             ALOGE("Failed to allocate command buffer for target image");
979             return false;
980         }
981 
982 	memset(mTask.commands.target, 0, sizeof(uint32_t) * G2DSFR_DST_FIELD_COUNT);
983     }
984 
985     delete [] mTask.source;
986     for (unsigned int i = 0; i < mMaxSourceCount; i++)
987         delete [] mTask.commands.source[i];
988 
989     mMaxSourceCount = 0;
990 
991     mTask.source = new g2d_layer[layercount];
992     if (!mTask.source) {
993         ALOGE("Failed to allocate %u source image descriptors", layercount);
994         return false;
995     }
996 
997     for (unsigned int i = 0; i < layercount; i++) {
998         mTask.commands.source[i] = new uint32_t[G2DSFR_SRC_FIELD_COUNT];
999         if (mTask.commands.source[i] == NULL) {
1000             ALOGE("Failed to allocate command buffer for source image");
1001             while (i-- > 0)
1002                 delete [] mTask.commands.source[i];
1003 
1004             delete [] mTask.source;
1005             mTask.source = NULL;
1006 
1007             return false;
1008         }
1009 
1010 	memset(mTask.commands.source[i], 0, sizeof(uint32_t) * G2DSFR_SRC_FIELD_COUNT);
1011     }
1012 
1013     mMaxSourceCount = layercount;
1014 
1015     return true;
1016 }
1017 
ioctlG2D(void)1018 int AcrylicCompositorG2D::ioctlG2D(void)
1019 {
1020     if (mVersion == 1) {
1021         if (mDev.ioctl(G2D_IOC_PROCESS, &mTask) < 0)
1022             return -errno;
1023     } else {
1024         struct g2d_compat_task task;
1025 
1026         memcpy(&task, &mTask, sizeof(mTask) - sizeof(mTask.commands));
1027         memcpy(task.commands.target, mTask.commands.target, sizeof(task.commands.target));
1028 
1029         for (unsigned int i = 0; i < mMaxSourceCount; i++)
1030             task.commands.source[i] = mTask.commands.source[i];
1031 
1032         task.commands.extra = mTask.commands.extra;
1033         task.commands.num_extra_regs = mTask.commands.num_extra_regs;
1034 
1035         if (mDev.ioctl(G2D_IOC_COMPAT_PROCESS, &task) < 0)
1036             return -errno;
1037 
1038         mTask.flags = task.flags;
1039         mTask.laptime_in_usec = task.laptime_in_usec;
1040 
1041         for (unsigned int i = 0; i < mTask.num_release_fences; i++)
1042             mTask.release_fence[i] = task.release_fence[i];
1043     }
1044 
1045     return 0;
1046 }
1047 
executeG2D(int fence[],unsigned int num_fences,bool nonblocking)1048 bool AcrylicCompositorG2D::executeG2D(int fence[], unsigned int num_fences, bool nonblocking)
1049 {
1050     ATRACE_CALL();
1051     if (!validateAllLayers())
1052         return false;
1053 
1054     unsigned int layercount = layerCount();
1055 
1056     // Set invalid fence fd to the entries exceeds the number of source and destination images
1057     for (unsigned int i = layercount; i < num_fences; i++)
1058         fence[i] = -1;
1059 
1060     if (num_fences > layercount + 1)
1061         num_fences = layercount + 1;
1062 
1063     bool hasBackground = hasBackgroundColor();
1064 
1065     g2d_fmt *g2dfmt = halfmt_to_g2dfmt(halfmt_to_g2dfmt_tbl, len_halfmt_to_g2dfmt_tbl, getCanvas().getFormat());
1066     if (g2dfmt && (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC))
1067         hasBackground = true;
1068 
1069     if (hasBackground) {
1070         layercount++;
1071 
1072         if (layercount > getCapabilities().maxLayerCount()) {
1073             ALOGE("Too many layers %d with the default background color configured", layerCount());
1074             return false;
1075         }
1076     }
1077 
1078     if (!reallocLayer(layercount))
1079         return false;
1080 
1081     sortLayers();
1082 
1083     mTask.flags = 0;
1084 
1085     if (!prepareImage(getCanvas(), mTask.target, mTask.commands.target, -1)) {
1086         ALOGE("Failed to configure the target image");
1087         return false;
1088     }
1089 
1090     if (getCanvas().isOTF())
1091         mTask.flags |= G2D_FLAG_HWFC;
1092 
1093     unsigned int baseidx = 0;
1094 
1095     if (hasBackground) {
1096         baseidx++;
1097         prepareSolidLayer(getCanvas(), mTask.source[0], mTask.commands.source[0]);
1098     }
1099 
1100     mTask.commands.target[G2DSFR_DST_YCBCRMODE] = 0;
1101 
1102     CSCMatrixWriter cscMatrixWriter(mTask.commands.target[G2DSFR_IMG_COLORMODE],
1103                                     getCanvas().getDataspace(),
1104                                     &mTask.commands.target[G2DSFR_DST_YCBCRMODE]);
1105 
1106     mTask.commands.target[G2DSFR_DST_YCBCRMODE] |= (G2D_LAYER_YCBCRMODE_OFFX | G2D_LAYER_YCBCRMODE_OFFY);
1107 
1108     for (unsigned int i = baseidx; i < layercount; i++) {
1109         AcrylicLayer &layer = *getLayer(i - baseidx);
1110 
1111         if (!prepareSource(layer, mTask.source[i],
1112                            mTask.commands.source[i], getCanvas().getImageDimension(),
1113                            i, i - baseidx)) {
1114             ALOGE("Failed to configure source layer %u", i - baseidx);
1115             return false;
1116         }
1117 
1118         if (!cscMatrixWriter.configure(mTask.commands.source[i][G2DSFR_IMG_COLORMODE],
1119                                        layer.getDataspace(),
1120                                        &mTask.commands.source[i][G2DSFR_SRC_YCBCRMODE])) {
1121             ALOGE("Failed to configure CSC coefficient of layer %d for dataspace %u",
1122                   i, layer.getDataspace());
1123             return false;
1124         }
1125 
1126         mHdrWriter.setLayerStaticMetadata(i, layer.getDataspace(),
1127                                           layer.getMinMasteringLuminance(),
1128                                           layer.getMaxMasteringLuminance());
1129 
1130         bool alpha_premult = (layer.getCompositingMode() == HWC_BLENDING_PREMULT)
1131                              || (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED);
1132         mHdrWriter.setLayerImageInfo(i, layer.getFormat(), alpha_premult);
1133         mHdrWriter.setLayerOpaqueData(i, layer.getLayerData(), layer.getLayerDataLength());
1134     }
1135 
1136     mHdrWriter.setTargetInfo(getCanvas().getDataspace(), getTargetDisplayInfo());
1137     mHdrWriter.setTargetDisplayLuminance(getMinTargetDisplayLuminance(), getMaxTargetDisplayLuminance());
1138 
1139     mHdrWriter.getCommands();
1140     mHdrWriter.getLayerHdrMode(mTask);
1141 
1142     mTask.num_source = layercount;
1143 
1144     if (nonblocking)
1145         mTask.flags |= G2D_FLAG_NONBLOCK;
1146 
1147     mTask.num_release_fences = num_fences;
1148     mTask.release_fence = reinterpret_cast<int *>(alloca(sizeof(int) * num_fences));
1149 
1150     mTask.commands.num_extra_regs = cscMatrixWriter.getRegisterCount() +
1151                                     mHdrWriter.getCommandCount();
1152     if (mUsePolyPhaseFilter)
1153         mTask.commands.num_extra_regs += getFilterCoefficientCount(mTask.commands.source, layercount);
1154 
1155     mTask.commands.extra = reinterpret_cast<g2d_reg *>(alloca(sizeof(g2d_reg) * mTask.commands.num_extra_regs));
1156 
1157     g2d_reg *regs = mTask.commands.extra;
1158 
1159     regs += cscMatrixWriter.write(regs);
1160 
1161     regs += updateFilterCoefficients(layercount, regs);
1162 
1163     mHdrWriter.write(regs);
1164 
1165     debug_show_g2d_task(mTask);
1166 
1167     if (ioctlG2D() < 0) {
1168         ALOGERR("Failed to process a task");
1169         show_g2d_task(mTask);
1170         return false;
1171     }
1172 
1173     mHdrWriter.putCommands();
1174 
1175     if (!!(mTask.flags & G2D_FLAG_ERROR)) {
1176         ALOGE("Error occurred during processing a task to G2D");
1177         show_g2d_task(mTask);
1178         return false;
1179     }
1180 
1181     getCanvas().clearSettingModified();
1182     getCanvas().setFence(-1);
1183 
1184     for (unsigned int i = 0; i < layerCount(); i++) {
1185         getLayer(i)->clearSettingModified();
1186         getLayer(i)->setFence(-1);
1187     }
1188 
1189     for (unsigned int i = 0; i < num_fences; i++)
1190         fence[i] = mTask.release_fence[i];
1191 
1192     return true;
1193 }
1194 
execute(int fence[],unsigned int num_fences)1195 bool AcrylicCompositorG2D::execute(int fence[], unsigned int num_fences)
1196 {
1197     if (!executeG2D(fence, num_fences, true)) {
1198         // Clearing all acquire fences because their buffers are expired.
1199         // The clients should configure everything again to start new execution
1200         for (unsigned int i = 0; i < layerCount(); i++)
1201             getLayer(i)->setFence(-1);
1202         getCanvas().setFence(-1);
1203 
1204         return false;
1205     }
1206 
1207     return true;
1208 }
1209 
execute(int * handle)1210 bool AcrylicCompositorG2D::execute(int *handle)
1211 {
1212     if (!executeG2D(NULL, 0, handle ? true : false)) {
1213         // Clearing all acquire fences because their buffers are expired.
1214         // The clients should configure everything again to start new execution
1215         for (unsigned int i = 0; i < layerCount(); i++)
1216             getLayer(i)->setFence(-1);
1217         getCanvas().setFence(-1);
1218 
1219         return false;
1220     }
1221 
1222     if (handle != NULL)
1223         *handle = 1; /* dummy handle */
1224 
1225     return true;
1226 }
1227 
waitExecution(int __unused handle)1228 bool AcrylicCompositorG2D::waitExecution(int __unused handle)
1229 {
1230     ALOGD_TEST("Waiting for execution of m2m1shot2 G2D completed by handle %d", handle);
1231 
1232     return true;
1233 }
1234 
requestPerformanceQoS(AcrylicPerformanceRequest * request)1235 bool AcrylicCompositorG2D::requestPerformanceQoS(AcrylicPerformanceRequest *request)
1236 {
1237     g2d_performance data;
1238 
1239     memset(&data, 0, sizeof(data));
1240 
1241     if (!request || (request->getFrameCount() == 0)) {
1242         if (mDev.ioctl(G2D_IOC_PERFORMANCE, &data) < 0) {
1243             ALOGERR("Failed to cancel performance request");
1244             return false;
1245         }
1246 
1247         ALOGD_TEST("Canceled performance request");
1248         return true;
1249     }
1250 
1251     ALOGD_TEST("Requesting performance: frame count %d:", request->getFrameCount());
1252     for (int i = 0; i < request->getFrameCount(); i++) {
1253         AcrylicPerformanceRequestFrame *frame = request->getFrame(i);
1254         uint64_t bandwidth = 0;
1255         bool src_yuv420_8b;
1256         bool src_rotate;
1257 
1258         src_rotate = false;
1259         src_yuv420_8b = false;
1260 
1261         unsigned int bpp;
1262         uint8_t planecount;
1263         uint32_t equiv_fmt;
1264         for (int idx = 0; idx < frame->getLayerCount(); idx++) {
1265             AcrylicPerformanceRequestLayer *layer = &(frame->mLayers[idx]);
1266             uint64_t layer_bw, pixelcount;
1267             int32_t is_scaling;
1268             uint32_t src_hori = layer->mSourceRect.size.hori;
1269             uint32_t src_vert = layer->mSourceRect.size.vert;
1270             uint32_t dst_hori = layer->mTargetRect.size.hori;
1271             uint32_t dst_vert = layer->mTargetRect.size.vert;
1272             data.frame[i].layer[idx].crop_width = src_hori;
1273             data.frame[i].layer[idx].crop_height = src_vert;
1274             data.frame[i].layer[idx].window_width = dst_hori;
1275             data.frame[i].layer[idx].window_height = dst_vert;
1276 
1277             // Src layer crop size is used when calculating read bandwidth.
1278             // Crop coordinates should be aligned in multiples of 16.
1279             pixelcount = (ALIGN(layer->mSourceRect.pos.hori + src_hori, 16) -
1280                           ALIGN_DOWN(layer->mSourceRect.pos.hori, 16)) *
1281                          (ALIGN(layer->mSourceRect.pos.vert + src_vert, 16) -
1282                           ALIGN_DOWN(layer->mSourceRect.pos.vert, 16));
1283 
1284             bpp = halfmt_bpp(layer->mPixFormat);
1285             planecount = halfmt_plane_count(layer->mPixFormat);
1286             equiv_fmt = find_format_equivalent(layer->mPixFormat);
1287 
1288             if (equiv_fmt == HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC ||
1289                 equiv_fmt == HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC)
1290                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_SBWC;
1291             else if (layer->mAttribute & AcrylicCanvas::ATTR_COMPRESSED) {
1292                 if (planecount == 1)
1293                     data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_RGB_AFBC;
1294                 else
1295                     data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_YUV_AFBC;
1296             } else if (planecount == 2)
1297                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_YUV2P;
1298 
1299             // src_yuv420_8b is used when calculating write bandwidth
1300             if (bpp == 12) src_yuv420_8b = true;
1301 
1302             layer_bw = pixelcount * bpp;
1303             // Below is checking if scaling is involved.
1304             // Comparisons are replaced by additions to avoid branches.
1305             if (!!(layer->mTransform & HAL_TRANSFORM_ROT_90)) {
1306                 src_rotate = true;
1307                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_ROTATE;
1308 
1309                 is_scaling = src_hori - dst_vert;
1310                 is_scaling += src_vert - dst_hori;
1311             } else {
1312                 is_scaling = src_hori - dst_hori;
1313                 is_scaling += src_vert - dst_vert;
1314             }
1315             // Weight to the bandwidth when scaling is involved is 1.125.
1316             // It is multiplied by 16 to avoid multiplication with a real number.
1317             // We also get benefit from shift instead of multiplication.
1318             if (is_scaling == 0) {
1319                 layer_bw <<= 4; // layer_bw * 16
1320             } else {
1321                 layer_bw = (layer_bw << 4) + (layer_bw << 1); // layer_bw * 18
1322             }
1323 
1324             bandwidth += layer_bw;
1325             ALOGD_TEST("        LAYER[%d]: BW %llu FMT %#x(%u) (%dx%d)@(%dx%d)on(%dx%d) --> (%dx%d)@(%dx%d) TRFM %#x",
1326                     idx, static_cast<unsigned long long>(layer_bw), layer->mPixFormat, bpp,
1327                     layer->mSourceRect.size.hori, layer->mSourceRect.size.vert,
1328                     layer->mSourceRect.pos.hori, layer->mSourceRect.pos.vert,
1329                     layer->mSourceDimension.hori, layer->mSourceDimension.vert,
1330                     layer->mTargetRect.size.hori, layer->mTargetRect.size.vert,
1331                     layer->mTargetRect.pos.hori, layer->mTargetRect.pos.vert, layer->mTransform);
1332         }
1333 
1334         bandwidth *= frame->mFrameRate;
1335         bandwidth >>= 17; // divide by 16(weight), 8(bpp) and 1024(kilobyte)
1336 
1337         data.frame[i].bandwidth_read = static_cast<uint32_t>(bandwidth);
1338 
1339         bpp = halfmt_bpp(frame->mTargetPixFormat);
1340         bandwidth = frame->mTargetDimension.hori * frame->mTargetDimension.vert;
1341         bandwidth *= frame->mFrameRate * bpp;
1342 
1343         // When src rotation is involved, src format includes yuv420(8bit-depth)
1344         // and dst format is yuv420(8bit-depth), weight to the write bandwidth is 2.
1345         // RSH 12 : bw * 2 / (bits_per_byte * kilobyte)
1346         // RHS 13 : bw * 1 / (bits_per_byte * kilobyte)
1347         bandwidth >>= ((bpp == 12) && src_yuv420_8b && src_rotate) ? 12 : 13;
1348         data.frame[i].bandwidth_write = static_cast<uint32_t>(bandwidth);
1349 
1350         if (frame->mHasBackgroundLayer)
1351             data.frame[i].frame_attr |= G2D_PERF_FRAME_SOLIDCOLORFILL;
1352 
1353         data.frame[i].num_layers = frame->getLayerCount();
1354         data.frame[i].target_pixelcount = frame->mTargetDimension.vert * frame->mTargetDimension.hori;
1355         data.frame[i].frame_rate = frame->mFrameRate;
1356 
1357         ALOGD_TEST("    FRAME[%d]: BW:(%u, %u) Layercount %d, Framerate %d, Target %dx%d, FMT %#x Background? %d",
1358             i, data.frame[i].bandwidth_read, data.frame[i].bandwidth_write, data.frame[i].num_layers, frame->mFrameRate,
1359             frame->mTargetDimension.hori, frame->mTargetDimension.vert, frame->mTargetPixFormat,
1360             frame->mHasBackgroundLayer);
1361     }
1362 
1363     data.num_frame = request->getFrameCount();
1364 
1365     if (mDev.ioctl(G2D_IOC_PERFORMANCE, &data) < 0) {
1366         ALOGERR("Failed to request performance");
1367         return false;
1368     }
1369 
1370     return true;
1371 }
1372 
prioritize(int priority)1373 int AcrylicCompositorG2D::prioritize(int priority)
1374 {
1375     static int32_t g2d_priorities[] = {
1376             G2D_LOW_PRIORITY,     // 0
1377             G2D_MEDIUM_PRIORITY,  // 1
1378             G2D_HIGH_PRIORITY,    // 2
1379     };
1380 
1381     if (priority == mPriority)
1382         return 0;
1383 
1384     if (Acrylic::prioritize(priority) < 0)
1385         return -1;
1386 
1387     int32_t arg;
1388 
1389     if (priority > 2)
1390         arg = G2D_HIGHEST_PRIORITY;
1391     else if (priority < 0)
1392         arg = G2D_DEFAULT_PRIORITY;
1393     else
1394         arg = g2d_priorities[priority];
1395 
1396     if (mDev.ioctl(G2D_IOC_PRIORITY, &arg) < 0) {
1397         if (errno != EBUSY) {
1398             ALOGERR("Failed to set priority on a context of G2D");
1399             return -1;
1400         }
1401 
1402         ALOGD("G2D Driver returned EBUSY but the priority of %d(%d) is successfully applied", priority, arg);
1403         return 1;
1404     }
1405 
1406     ALOGD_TEST("Applied the priority of %d(%d) successfully", priority, arg);
1407 
1408     mPriority = priority;
1409 
1410     return 0;
1411 }
1412