1 /*
2  * Copyright Samsung Electronics Co.,LTD.
3  * Copyright (C) 2017 The Android Open Source Project
4  *
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 #define ATRACE_TAG (ATRACE_TAG_GRAPHICS | ATRACE_TAG_HAL)
19 
20 #include "acrylic_g2d.h"
21 
22 #include <alloca.h>
23 #include <exynos_format.h> // hardware/smasung_slsi/exynos/include
24 #include <hardware/hwcomposer2.h>
25 #include <log/log.h>
26 #include <sys/ioctl.h>
27 #include <system/graphics.h>
28 #include <utils/Trace.h>
29 
30 #include <algorithm>
31 #include <cstring>
32 
33 enum {
34     G2D_CSC_STD_UNDEFINED = -1,
35     G2D_CSC_STD_601       = 0,
36     G2D_CSC_STD_709       = 1,
37     G2D_CSC_STD_2020      = 2,
38     G2D_CSC_STD_P3        = 3,
39 
40     G2D_CSC_STD_COUNT     = 4,
41 };
42 
43 enum {
44     G2D_CSC_RANGE_LIMITED,
45     G2D_CSC_RANGE_FULL,
46 
47     G2D_CSC_RANGE_COUNT,
48 };
49 
50 static char csc_std_to_matrix_index[] = {
51     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_UNSPECIFIED
52     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_BT709
53     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_625
54     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_625_UNADJUSTED
55     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_525
56     G2D_CSC_STD_601,                          // HAL_DATASPACE_STANDARD_BT601_525_UNADJUSTED
57     G2D_CSC_STD_2020,                         // HAL_DATASPACE_STANDARD_BT2020
58     G2D_CSC_STD_2020,                         // HAL_DATASPACE_STANDARD_BT2020_CONSTANT_LUMINANCE
59     static_cast<char>(G2D_CSC_STD_UNDEFINED), // HAL_DATASPACE_STANDARD_BT470M
60     G2D_CSC_STD_709,                          // HAL_DATASPACE_STANDARD_FILM
61     G2D_CSC_STD_P3,                           // HAL_DATASPACE_STANDARD_DCI_P3
62     static_cast<char>(G2D_CSC_STD_UNDEFINED), // HAL_DATASPACE_STANDARD_ADOBE_RGB
63 };
64 
65 static uint16_t YCbCr2sRGBCoefficients[G2D_CSC_STD_COUNT * G2D_CSC_RANGE_COUNT][9] = {
66     {0x0254, 0x0000, 0x0331, 0x0254, 0xFF37, 0xFE60, 0x0254, 0x0409, 0x0000}, // 601 limited
67     {0x0200, 0x0000, 0x02BE, 0x0200, 0xFF54, 0xFE9B, 0x0200, 0x0377, 0x0000}, // 601 full
68     {0x0254, 0x0000, 0x0396, 0x0254, 0xFF93, 0xFEEF, 0x0254, 0x043A, 0x0000}, // 709 limited
69     {0x0200, 0x0000, 0x0314, 0x0200, 0xFFA2, 0xFF16, 0x0200, 0x03A1, 0x0000}, // 709 full
70     {0x0254, 0x0000, 0x035B, 0x0254, 0xFFA0, 0xFEB3, 0x0254, 0x0449, 0x0000}, // 2020 limited
71     {0x0200, 0x0000, 0x02E2, 0x0200, 0xFFAE, 0xFEE2, 0x0200, 0x03AE, 0x0000}, // 2020 full
72     {0x0254, 0x0000, 0x03AE, 0x0254, 0xFF96, 0xFEEE, 0x0254, 0x0456, 0x0000}, // DCI-P3 limited
73     {0x0200, 0x0000, 0x0329, 0x0200, 0xFFA5, 0xFF15, 0x0200, 0x03B9, 0x0000}, // DCI-P3 full
74 };
75 
76 static uint16_t sRGB2YCbCrCoefficients[G2D_CSC_STD_COUNT * G2D_CSC_RANGE_COUNT][9] = {
77     {0x0083, 0x0102, 0x0032, 0xFFB4, 0xFF6B, 0x00E1, 0x00E1, 0xFF44, 0xFFDB}, // 601 limited
78     {0x0099, 0x012D, 0x003A, 0xFFA8, 0xFF53, 0x0106, 0x0106, 0xFF25, 0xFFD5}, // 601 full
79     {0x005D, 0x013A, 0x0020, 0xFFCC, 0xFF53, 0x00E1, 0x00E1, 0xFF34, 0xFFEB}, // 709 limited
80     {0x006D, 0x016E, 0x0025, 0xFFC4, 0xFF36, 0x0106, 0x0106, 0xFF12, 0xFFE8}, // 709 full
81     {0x0074, 0x012A, 0x001A, 0xFFC1, 0xFF5A, 0x00E1, 0x00E1, 0xFF31, 0xFFEE}, // 2020 limited
82     {0x0087, 0x015B, 0x001E, 0xFFB7, 0xFF43, 0x0106, 0x0106, 0xFF0F, 0xFFEB}, // 2020 full
83     {0x006B, 0x0171, 0x0023, 0xFFC6, 0xFF3A, 0x0100, 0x0100, 0xFF16, 0xFFEA}, // DCI-P3 limited(full)
84     {0x006B, 0x0171, 0x0023, 0xFFC6, 0xFF3A, 0x0100, 0x0100, 0xFF16, 0xFFEA}, // DCI-P3 full
85 };
86 
87 #define CSC_MATRIX_REGISTER_COUNT 9
88 #define CSC_MATRIX_REGISTER_SIZE  (CSC_MATRIX_REGISTER_COUNT * sizeof(uint32_t))
89 
g2dfmt_is_ycbcr(unsigned int g2dfmt)90 static inline bool g2dfmt_is_ycbcr(unsigned int g2dfmt)
91 {
92     g2dfmt &= G2D_DATAFMT_MASK;
93     return (G2D_DATAFMT_YUV_MIN <= g2dfmt) && (g2dfmt <= G2D_DATAFMT_YUV_MAX);
94 }
95 
96 class CSCMatrixWriter {
97     enum { CSC_MATRIX_MAX_COUNT = 4, CSC_MATRIX_INVALID_INDEX = 200 };
98     enum { CSC_MATRIX_SRC_BASE = 0x2000, CSC_MATRIX_DST_BASE = 0x2100 };
99 public:
CSCMatrixWriter(unsigned int g2dfmt,unsigned int dataspace,uint32_t * command)100     CSCMatrixWriter(unsigned int g2dfmt, unsigned int dataspace, uint32_t *command)
101                     : mMatrixCount(0), mMatrixTargetIndex(CSC_MATRIX_INVALID_INDEX) {
102         // Ignore if unsupported dataspace is specified.
103         // G2D also works for the case.
104         // But the correctness of the result is not guaranteed.
105         if (g2dfmt_is_ycbcr(g2dfmt)) {
106             mMatrixTargetIndex = findMatrixIndex(dataspace);
107             if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
108                 *command = G2D_LAYER_YCBCRMODE_WIDE;
109         }
110     }
111 
configure(unsigned int g2dfmt,unsigned int dataspace,uint32_t * command)112     bool configure(unsigned int g2dfmt, unsigned int dataspace, uint32_t *command) {
113         if (!g2dfmt_is_ycbcr(g2dfmt))
114             return true;
115 
116         unsigned int spcidx = findMatrixIndex(dataspace);
117 
118         if (spcidx == CSC_MATRIX_INVALID_INDEX)
119             return false;
120 
121         if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
122             *command = G2D_LAYER_YCBCRMODE_WIDE;
123 
124         for (int i = 0; i < mMatrixCount; i++) {
125             if (mMatrixIndex[i] == spcidx) {
126                 *command |= i;
127                 return true;
128             }
129         }
130 
131         if (mMatrixCount == CSC_MATRIX_MAX_COUNT) {
132             ALOGE("Too many CSC requirements");
133             return false;
134         }
135 
136         mMatrixIndex[mMatrixCount] = spcidx;
137 
138         *command |= mMatrixCount++;
139 
140         return true;
141     }
142 
getRegisterCount()143     unsigned int getRegisterCount() {
144         unsigned int count = CSC_MATRIX_REGISTER_COUNT * mMatrixCount;
145         if (mMatrixTargetIndex != CSC_MATRIX_INVALID_INDEX)
146             count += CSC_MATRIX_REGISTER_COUNT;
147         return count;
148     }
149 
write(g2d_reg regs[])150     unsigned int write(g2d_reg regs[]) {
151         unsigned int count = 0;
152 
153         if (mMatrixTargetIndex != CSC_MATRIX_INVALID_INDEX) {
154             writeSingle(CSC_MATRIX_DST_BASE,
155                         &regs[count], sRGB2YCbCrCoefficients[mMatrixTargetIndex]);
156             count += CSC_MATRIX_REGISTER_COUNT;
157         }
158 
159         for (int m = 0; m < mMatrixCount; m++) {
160             writeSingle(CSC_MATRIX_SRC_BASE + m * CSC_MATRIX_REGISTER_SIZE,
161                         &regs[count], YCbCr2sRGBCoefficients[mMatrixIndex[m]]);
162             count += CSC_MATRIX_REGISTER_COUNT;
163         }
164 
165         return count;
166     }
167 
168 private:
writeSingle(unsigned int base,g2d_reg regs[],uint16_t matrix[9])169     void writeSingle(unsigned int base, g2d_reg regs[], uint16_t matrix[9]) {
170         for (unsigned int idx = 0; idx < CSC_MATRIX_REGISTER_COUNT; idx++) {
171             regs[idx].offset = base;
172             regs[idx].value = matrix[idx];
173             base += sizeof(uint32_t);
174         }
175     }
176 
findMatrixIndex(unsigned int dataspace)177     unsigned int findMatrixIndex(unsigned int dataspace) {
178         unsigned int index, colorspace;
179 
180         colorspace = (dataspace & HAL_DATASPACE_STANDARD_MASK) >> HAL_DATASPACE_STANDARD_SHIFT;
181         if (colorspace >= ARRSIZE(csc_std_to_matrix_index)) {
182             ALOGE("Data space %d is not supported by G2D", dataspace);
183             return CSC_MATRIX_INVALID_INDEX;
184         }
185 
186         index = csc_std_to_matrix_index[colorspace] * G2D_CSC_RANGE_COUNT;
187         if ((dataspace & HAL_DATASPACE_RANGE_FULL) != 0)
188             index++;
189 
190         return index;
191     }
192 
193     unsigned int mMatrixIndex[CSC_MATRIX_MAX_COUNT];
194     int mMatrixCount;
195     unsigned int mMatrixTargetIndex;
196 };
197 
198 #define G2D_FILTER_COEF_BASE 0x6000
199 #define G2D_FILTER_COEF_REG(idx) (0x6000 + (idx) * 0x400)
200 #define G2D_FILTER_C_OFFSET 0x200
201 #define G2D_SCALE_FACTOR(from, to) ((static_cast<uint32_t>(from) << G2D_SCALEFACTOR_FRACBITS) / (to))
202 
203 #define SI11(v)                              static_cast<uint32_t>((v) & 0x7FF)
204 #define FILTER_HCOEF(a, b, c, d, e, f, g, h) {SI11(a), SI11(b), SI11(c), SI11(d), SI11(e), SI11(f), SI11(g), SI11(h)}
205 #define FILTER_VCOEF(a, b, c, d)             {SI11(a), SI11(b), SI11(c), SI11(d)}
206 
207 #define NUM_HORI_COEFFICIENTS 8
208 #define NUM_VERT_COEFFICIENTS 4
209 #define NUM_FILTER_PHASE 9
210 #define NUM_FILTER_COEF_SETS 7
211 
212 #define NUM_VERT_COEF_REGS (NUM_FILTER_PHASE * NUM_VERT_COEFFICIENTS)
213 #define NUM_HORI_COEF_REGS (NUM_FILTER_PHASE * NUM_HORI_COEFFICIENTS)
214 
215 static uint32_t g2dHoriFilterCoef[NUM_FILTER_COEF_SETS][NUM_FILTER_PHASE][NUM_HORI_COEFFICIENTS] = {
216     { // Upsampling
217         FILTER_HCOEF(   0,   0,   0, 512,   0,   0,   0,   0), FILTER_HCOEF(  -2,   8, -25, 509,  30,  -9,   2,  -1), FILTER_HCOEF(  -4,  14, -46, 499,  64, -19,   5,  -1),
218         FILTER_HCOEF(  -5,  20, -62, 482, 101, -30,   8,  -2), FILTER_HCOEF(  -5,  23, -73, 458, 142, -41,  12,  -3), FILTER_HCOEF(  -6,  25, -80, 429, 185, -53,  15,  -3),
219         FILTER_HCOEF(  -6,  26, -83, 395, 228, -63,  19,  -4), FILTER_HCOEF(  -6,  25, -82, 357, 273, -71,  21,  -5), FILTER_HCOEF(  -5,  23, -78, 316, 316, -78,  23,  -5),
220     }, { // x7/8 Downsampling
221         FILTER_HCOEF(  12, -32,  56, 444,  52, -32,  12,   0), FILTER_HCOEF(   9, -24,  29, 445,  82, -39,  13,  -3), FILTER_HCOEF(   7, -16,   6, 438, 112, -46,  14,  -3),
222         FILTER_HCOEF(   5,  -9, -14, 426, 144, -52,  15,  -3), FILTER_HCOEF(   3,  -3, -30, 410, 177, -58,  16,  -3), FILTER_HCOEF(   2,   2, -43, 390, 211, -63,  16,  -3),
223         FILTER_HCOEF(   1,   7, -53, 365, 244, -66,  16,  -2), FILTER_HCOEF(   0,  10, -60, 338, 277, -66,  15,  -2), FILTER_HCOEF(  -1,  13, -65, 309, 309, -65,  13,  -1),
224     }, { // x6/8 Downsampling
225         FILTER_HCOEF(   8, -44, 100, 384, 100, -44,   8,   0), FILTER_HCOEF(   9, -40,  77, 382, 123, -47,   8,   0), FILTER_HCOEF(   8, -36,  57, 377, 147, -49,   7,   1),
226         FILTER_HCOEF(   8, -32,  38, 369, 171, -49,   5,   2), FILTER_HCOEF(   8, -27,  20, 358, 196, -48,   3,   2), FILTER_HCOEF(   7, -22,   5, 344, 221, -47,   1,   3),
227         FILTER_HCOEF(   7, -18,  -9, 329, 245, -43,  -2,   3), FILTER_HCOEF(   5, -13, -20, 310, 268, -37,  -5,   4), FILTER_HCOEF(   5,  -9, -30, 290, 290, -30,  -9,   5),
228     }, { // x5/8 Downsampling
229         FILTER_HCOEF(  -3, -31, 130, 320, 130, -31,  -3,   0), FILTER_HCOEF(  -3, -32, 113, 319, 147, -29,  -6,   3), FILTER_HCOEF(  -1, -33,  97, 315, 165, -26,  -8,   3),
230         FILTER_HCOEF(   0, -32,  81, 311, 182, -22, -11,   3), FILTER_HCOEF(   1, -31,  66, 304, 199, -17, -13,   3), FILTER_HCOEF(   2, -30,  52, 296, 216, -11, -16,   3),
231         FILTER_HCOEF(   2, -28,  38, 286, 232,  -3, -18,   3), FILTER_HCOEF(   3, -25,  26, 274, 247,   5, -21,   3), FILTER_HCOEF(   3, -23,  15, 261, 261,  15, -23,   3),
232     }, { // x4/8 Downsampling
233         FILTER_HCOEF( -11,   0, 140, 255, 140,   0, -12,   0), FILTER_HCOEF( -10,  -4, 129, 254, 151,   5, -13,   0), FILTER_HCOEF(  -9,  -7, 117, 253, 163,  10, -14,  -1),
234         FILTER_HCOEF(  -8, -10, 106, 250, 174,  16, -15,  -1), FILTER_HCOEF(  -7, -12,  95, 246, 185,  22, -16,  -1), FILTER_HCOEF(  -6, -14,  85, 241, 195,  29, -16,  -2),
235         FILTER_HCOEF(  -5, -15,  74, 236, 204,  37, -17,  -2), FILTER_HCOEF(  -5, -16,  64, 229, 214,  46, -17,  -3), FILTER_HCOEF(  -4, -17,  55, 222, 222,  55, -17,  -4),
236     }, { // x3/8 Downsampling
237         FILTER_HCOEF(  -5,  31, 133, 195, 133,  31,  -6,   0), FILTER_HCOEF(  -5,  27, 126, 195, 139,  37,  -4,  -3), FILTER_HCOEF(  -5,  23, 119, 194, 146,  41,  -3,  -3),
238         FILTER_HCOEF(  -5,  19, 112, 193, 152,  47,  -2,  -4), FILTER_HCOEF(  -5,  16, 105, 191, 158,  53,  -2,  -4), FILTER_HCOEF(  -5,  12,  98, 189, 163,  59,   0,  -4),
239         FILTER_HCOEF(  -5,  10,  91, 185, 169,  65,   1,  -4), FILTER_HCOEF(  -5,   7,  84, 182, 174,  71,   3,  -4), FILTER_HCOEF(  -5,   5,  78, 178, 178,  78,   5,  -5),
240     }, { // x2/8 Downsampling
241         FILTER_HCOEF(  10,  52, 118, 152, 118,  52,  10,   0), FILTER_HCOEF(   9,  48, 114, 152, 122,  56,  11,   0), FILTER_HCOEF(   7,  45, 110, 151, 125,  60,  13,   1),
242         FILTER_HCOEF(   6,  41, 106, 150, 129,  64,  15,   1), FILTER_HCOEF(   5,  38, 102, 149, 132,  68,  17,   1), FILTER_HCOEF(   4,  35,  98, 148, 135,  72,  19,   1),
243         FILTER_HCOEF(   4,  31,  94, 146, 138,  77,  21,   1), FILTER_HCOEF(   3,  29,  89, 145, 140,  81,  23,   2), FILTER_HCOEF(   2,  26,  85, 143, 143,  85,  26,   2),
244     }
245 };
246 
247 static uint32_t g2dVertFilterCoef[NUM_FILTER_COEF_SETS][NUM_FILTER_PHASE][NUM_VERT_COEFFICIENTS] = {
248     {    // Upsampling
249         FILTER_VCOEF(   0, 512,   0,   0), FILTER_VCOEF( -15, 508,  20,  -1), FILTER_VCOEF( -25, 495,  45,  -3),
250         FILTER_VCOEF( -31, 473,  75,  -5), FILTER_VCOEF( -33, 443, 110,  -8), FILTER_VCOEF( -33, 408, 148, -11),
251         FILTER_VCOEF( -31, 367, 190, -14), FILTER_VCOEF( -27, 324, 234, -19), FILTER_VCOEF( -23, 279, 279, -23),
252     }, { // x7/8 Downsampling
253         FILTER_VCOEF(  32, 448,  32,   0), FILTER_VCOEF(  17, 446,  55,  -6), FILTER_VCOEF(   3, 437,  79,  -7),
254         FILTER_VCOEF(  -7, 421, 107,  -9), FILTER_VCOEF( -14, 399, 138, -11), FILTER_VCOEF( -18, 373, 170, -13),
255         FILTER_VCOEF( -20, 343, 204, -15), FILTER_VCOEF( -20, 310, 240, -18), FILTER_VCOEF( -19, 275, 275, -19),
256     }, { // x6/8 Downsampling
257         FILTER_VCOEF(  61, 390,  61,   0), FILTER_VCOEF(  46, 390,  83,  -7), FILTER_VCOEF(  31, 383, 106,  -8),
258         FILTER_VCOEF(  19, 371, 130,  -8), FILTER_VCOEF(   9, 356, 156,  -9), FILTER_VCOEF(   2, 337, 183, -10),
259         FILTER_VCOEF(  -3, 315, 210, -10), FILTER_VCOEF(  -7, 291, 238, -10), FILTER_VCOEF(  -9, 265, 265,  -9),
260     }, { // x5/8 Downsampling
261         FILTER_VCOEF(  85, 341,  86,   0), FILTER_VCOEF(  71, 341, 105,  -5), FILTER_VCOEF(  56, 336, 124,  -4),
262         FILTER_VCOEF(  43, 328, 145,  -4), FILTER_VCOEF(  32, 317, 166,  -3), FILTER_VCOEF(  23, 304, 187,  -2),
263         FILTER_VCOEF(  16, 288, 209,  -1), FILTER_VCOEF(   9, 271, 231,   1), FILTER_VCOEF(   5, 251, 251,   5),
264     }, { // x4/8 Downsampling
265         FILTER_VCOEF( 104, 304, 104,   0), FILTER_VCOEF(  89, 302, 120,   1), FILTER_VCOEF(  76, 298, 136,   2),
266         FILTER_VCOEF(  63, 293, 153,   3), FILTER_VCOEF(  52, 285, 170,   5), FILTER_VCOEF(  42, 275, 188,   7),
267         FILTER_VCOEF(  33, 264, 205,  10), FILTER_VCOEF(  26, 251, 221,  14), FILTER_VCOEF(  20, 236, 236,  20),
268     }, { // x3/8 Downsampling
269         FILTER_VCOEF( 118, 276, 118,   0), FILTER_VCOEF( 103, 273, 129,   7), FILTER_VCOEF(  90, 270, 143,   9),
270         FILTER_VCOEF(  78, 266, 157,  11), FILTER_VCOEF(  67, 260, 171,  14), FILTER_VCOEF(  57, 253, 185,  17),
271         FILTER_VCOEF(  48, 244, 199,  21), FILTER_VCOEF(  40, 234, 211,  27), FILTER_VCOEF(  33, 223, 223,  33),
272     }, { // x2/8 Downsampling
273         FILTER_VCOEF( 127, 258, 127,   0), FILTER_VCOEF( 111, 252, 135,  14), FILTER_VCOEF( 100, 250, 147,  15),
274         FILTER_VCOEF(  88, 247, 159,  18), FILTER_VCOEF(  78, 242, 171,  21), FILTER_VCOEF(  68, 237, 182,  25),
275         FILTER_VCOEF(  59, 230, 193,  30), FILTER_VCOEF(  50, 222, 204,  36), FILTER_VCOEF(  43, 213, 213,  43),
276     }
277 };
278 
findFilterCoefficientsIndex(uint32_t factor)279 static unsigned int findFilterCoefficientsIndex(uint32_t factor)
280 {
281     static uint32_t choicetable[NUM_FILTER_COEF_SETS] = {
282         G2D_SCALE_FACTOR(8, 8), G2D_SCALE_FACTOR(8, 7), G2D_SCALE_FACTOR(8, 6), G2D_SCALE_FACTOR(8, 5),
283         G2D_SCALE_FACTOR(8, 4), G2D_SCALE_FACTOR(8, 3), G2D_SCALE_FACTOR(8, 2),
284     };
285 
286     for (unsigned int i = 0; i < NUM_FILTER_COEF_SETS; i++)
287         if (factor <= choicetable[i])
288             return i;
289     // if i == NUM_FILTER_COEF_SETS, the downsampling factor is larger than 4.0 which is not supported by the filter.
290     return NUM_FILTER_COEF_SETS - 1;
291 }
292 
293 template<typename CoefT>
__writeFilterCoefficients(CoefT & coef_set,unsigned int index,uint32_t base,g2d_reg regs[])294 static unsigned int __writeFilterCoefficients(CoefT &coef_set, unsigned int index, uint32_t base, g2d_reg regs[])
295 {
296     // The default value of filter coefficients are values of 8:8/zoom-in
297     // So, do not update redundantly.
298     if (index == 0)
299         return 0;
300 
301     unsigned int cnt = 0;
302 
303     for (auto &coef_table: coef_set[index]) {
304         uint32_t coef_base = base;
305         // register offsets of filter coeffcients are ordered by phase number then tab index
306         // while values are ordered by tab index then phase number in the above coefficients array.
307         // So register offset is increased by the number of tabs instead of 1.
308         // The coefficients array is specified in the order of tab index due to readability
309         // because the coefficient values are also specified in the same order in UM.
310         for (auto coef: coef_table) {
311             regs[cnt].offset = coef_base;
312             regs[cnt].value = coef;
313             coef_base += (sizeof(coef_set[index]) / sizeof(coef_table)) * sizeof(coef_table[0]);
314             cnt++;
315         }
316         base += sizeof(uint32_t);
317     }
318 
319     return cnt;
320 }
321 
getChromaScaleFactor(uint32_t colormode,unsigned int * hfactor,unsigned int * vfactor)322 void getChromaScaleFactor(uint32_t colormode, unsigned int *hfactor, unsigned int *vfactor)
323 {
324     switch (colormode & G2D_DATAFMT_MASK) {
325         case G2D_DATAFMT_YUV420SP:
326         case G2D_DATAFMT_YUV420P:
327             *hfactor /= 2;
328             [[fallthrough]];
329         case G2D_DATAFMT_YUV422SP:
330         case G2D_DATAFMT_YUV422I:
331             *vfactor /= 2;
332             break;
333         default:
334             break;
335     }
336 }
337 
writeFilterCoefficients(uint32_t hfactor,uint32_t vfactor,uint32_t colormode,unsigned layer_index,g2d_reg regs[])338 static unsigned int writeFilterCoefficients(uint32_t hfactor, uint32_t vfactor, uint32_t colormode,
339                                             unsigned layer_index, g2d_reg regs[])
340 {
341     unsigned int hindex = findFilterCoefficientsIndex(hfactor);
342     unsigned int vindex = findFilterCoefficientsIndex(vfactor);
343     // Filter coefficients of 1:1 and upsampling are configured to the filter by default (reset value)
344     if ((hindex == 0) && (vindex == 0))
345         return 0;
346 
347     unsigned int base = G2D_FILTER_COEF_REG(layer_index);
348     unsigned int cnt = 0;
349     // Y Coefficients
350     cnt += __writeFilterCoefficients(g2dVertFilterCoef, vindex, base, regs);
351     cnt += __writeFilterCoefficients(g2dHoriFilterCoef, hindex, base + sizeof(g2dVertFilterCoef[0]), regs + cnt);
352     if (IS_YUV(colormode)) {
353         // C Coefficients
354         getChromaScaleFactor(colormode, &hfactor, &vfactor);
355 
356         hindex = findFilterCoefficientsIndex(hfactor);
357         vindex = findFilterCoefficientsIndex(vfactor);
358         base += G2D_FILTER_C_OFFSET;
359         cnt += __writeFilterCoefficients(g2dVertFilterCoef, vindex, base, regs + cnt);
360         cnt += __writeFilterCoefficients(g2dHoriFilterCoef, hindex, base + sizeof(g2dVertFilterCoef[0]), regs + cnt);
361     }
362 
363     return cnt;
364 }
365 
getFilterCoefficientCount(uint32_t * src_cmds[],unsigned int layer_count)366 static unsigned int getFilterCoefficientCount(uint32_t *src_cmds[], unsigned int layer_count)
367 {
368     unsigned int count = 0;
369 
370 
371     for (unsigned int i = 0; i < layer_count; i++) {
372         unsigned int layer_coef_cnt = 0;
373         unsigned int hfactor = src_cmds[i][G2DSFR_SRC_XSCALE];
374         unsigned int vfactor = src_cmds[i][G2DSFR_SRC_YSCALE];
375 
376         if (hfactor > G2D_SCALE_FACTOR(8, 8))
377             layer_coef_cnt += NUM_HORI_COEF_REGS;
378         if (vfactor > G2D_SCALE_FACTOR(8, 8))
379             layer_coef_cnt += NUM_VERT_COEF_REGS;
380         if (IS_YUV(src_cmds[i][G2DSFR_IMG_COLORMODE])) {
381             getChromaScaleFactor(src_cmds[i][G2DSFR_IMG_COLORMODE], &hfactor, &vfactor);
382             if (hfactor > G2D_SCALE_FACTOR(8, 8))
383                 layer_coef_cnt += NUM_HORI_COEF_REGS;
384             if (vfactor > G2D_SCALE_FACTOR(8, 8))
385                 layer_coef_cnt += NUM_VERT_COEF_REGS;
386         }
387 
388         count += layer_coef_cnt;
389     }
390 
391     return count;
392 }
393 
show_g2d_layer(const char * title,int idx,const g2d_layer & layer)394 static void show_g2d_layer(const char *title, int idx, const g2d_layer &layer)
395 {
396     ALOGD("%s%d: flags %#x, fence %d, buffer_type %d, num_buffers %d", title, idx,
397           layer.flags, layer.fence, layer.buffer_type, layer.num_buffers);
398     for (unsigned int i = 0; i < layer.num_buffers; i++) {
399         ALOGD("         buf[%d] ptr %p, fd %d, offset %u, length %u",
400               i, layer.buffer[i].userptr,
401               layer.buffer[i].dmabuf.fd, layer.buffer[i].dmabuf.offset,
402               layer.buffer[i].length);
403     }
404 }
405 
show_g2d_commands(const g2d_commands & cmds)406 static void show_g2d_commands(const g2d_commands &cmds)
407 {
408     for (unsigned int i = 0; i < G2DSFR_DST_FIELD_COUNT; i++)
409         ALOGD("DST[%02d]: %#010x", i, cmds.target[i]);
410 
411     for (unsigned int idx = 0; idx < G2D_MAX_IMAGES; idx++) {
412         if (cmds.source[idx]) {
413             for (unsigned int i = 0; i < G2DSFR_SRC_FIELD_COUNT; i++)
414                 ALOGD("SRC[%02d][%02d]: %#010x", idx, i, cmds.source[idx][i]);
415         }
416     }
417 
418     if (cmds.extra) {
419         for (unsigned int i = 0; i < cmds.num_extra_regs; i++)
420             ALOGD("EXTRA: offset %#010x, value %#010x",
421                   cmds.extra[i].offset, cmds.extra[i].value);
422     }
423 }
424 
show_g2d_task(const g2d_task & task)425 static void show_g2d_task(const g2d_task &task)
426 {
427     ALOGD("Showing the content of G2D task descriptor ver %#010x", task.version);
428     ALOGD("source count %d, flags %#x, priority %d, num_release_fences %d",
429           task.num_source, task.flags, task.priority, task.num_release_fences);
430     show_g2d_layer("Target", 0, task.target);
431     for (unsigned int i = 0; i < task.num_source; i++)
432         show_g2d_layer("Source", i, task.source[i]);
433     show_g2d_commands(task.commands);
434 }
435 
436 #ifdef LIBACRYL_DEBUG
debug_show_g2d_task(const g2d_task & task)437 static void debug_show_g2d_task(const g2d_task &task)
438 {
439     ALOGD("Showing the content of G2D task descriptor ver %#010x", task.version);
440     ALOGD("source count %d, flags %#x, priority %d, num_release_fences %d",
441           task.num_source, task.flags, task.priority, task.num_release_fences);
442     show_g2d_layer("Target", 0, task.target);
443     for (unsigned int i = 0; i < task.num_source; i++)
444         show_g2d_layer("Source", i, task.source[i]);
445     show_g2d_commands(task.commands);
446 }
447 #else
448 #define debug_show_g2d_task(task) do { } while (0)
449 #endif
450 
451 struct g2d_fmt {
452     uint32_t halfmt;
453     uint32_t g2dfmt;
454     uint32_t num_bufs;
455     uint32_t rgb_bpp;
456 };
457 
458 static g2d_fmt __halfmt_to_g2dfmt_legacy[] = {
459 //  {halfmt,                                      g2dfmt,  num_buffers, rgbbpp}
460     {HAL_PIXEL_FORMAT_RGBA_8888,                  G2D_FMT_ABGR8888,  1, 4},
461     {HAL_PIXEL_FORMAT_BGRA_8888,                  G2D_FMT_ARGB8888,  1, 4},
462     {HAL_PIXEL_FORMAT_RGBX_8888,                  G2D_FMT_XBGR8888,  1, 4},
463     {HAL_PIXEL_FORMAT_RGBA_1010102,               G2D_FMT_ABGR2101010, 1, 4},
464     {HAL_PIXEL_FORMAT_RGB_888,                    G2D_FMT_RGB888,    1, 3},
465     {HAL_PIXEL_FORMAT_RGB_565,                    G2D_FMT_RGB565,    1, 2},
466 //  {HAL_PIXEL_FORMAT_YV12,                       G2D_FMT_YV12,      1, 0},
467 //  {HAL_PIXEL_FORMAT_EXYNOS_YV12_M,              G2D_FMT_YV12,      3, 0},
468     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P,         G2D_FMT_YV12,      1, 0},
469     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_PN,        G2D_FMT_YV12,      1, 0},
470     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P_M,       G2D_FMT_YV12,      3, 0},
471     {HAL_PIXEL_FORMAT_YCrCb_420_SP,               G2D_FMT_NV21,      1, 0},
472     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M,      G2D_FMT_NV21,      2, 0},
473     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_FULL, G2D_FMT_NV21,      2, 0},
474     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP,        G2D_FMT_NV12,      1, 0},
475     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M,      G2D_FMT_NV12,      2, 0},
476     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,       G2D_FMT_NV12,      1, 0},
477     {HAL_PIXEL_FORMAT_YCBCR_P010,                 G2D_FMT_NV12_P010_LGCY, 1, 0},
478     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_P010_M,        G2D_FMT_NV12_P010_LGCY, 2, 0},
479     {HAL_PIXEL_FORMAT_YCbCr_422_I,                G2D_FMT_YUYV,      1, 0},
480     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_422_I,         G2D_FMT_YVYU,      1, 0},
481     {HAL_PIXEL_FORMAT_YCbCr_422_SP,               G2D_FMT_NV16,      1, 0},
482     // TODO: add p010
483 };
484 
485 static g2d_fmt __halfmt_to_g2dfmt[] = {
486 //  {halfmt,                                      g2dfmt,  num_buffers, rgbbpp}
487     {HAL_PIXEL_FORMAT_RGBA_8888,                  G2D_FMT_ABGR8888,  1, 4},
488     {HAL_PIXEL_FORMAT_BGRA_8888,                  G2D_FMT_ARGB8888,  1, 4},
489     {HAL_PIXEL_FORMAT_RGBX_8888,                  G2D_FMT_XBGR8888,  1, 4},
490     {HAL_PIXEL_FORMAT_RGBA_1010102,               G2D_FMT_ABGR2101010, 1, 4},
491     {HAL_PIXEL_FORMAT_RGB_888,                    G2D_FMT_RGB888,    1, 3},
492     {HAL_PIXEL_FORMAT_RGB_565,                    G2D_FMT_RGB565,    1, 2},
493     {HAL_PIXEL_FORMAT_YV12,                       G2D_FMT_YV12,      1, 0},
494     {HAL_PIXEL_FORMAT_EXYNOS_YV12_M,              G2D_FMT_YV12,      3, 0},
495     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P,         G2D_FMT_YUV420P,   1, 0},
496     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_PN,        G2D_FMT_YUV420P,   1, 0},
497     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_P_M,       G2D_FMT_YUV420P,   3, 0},
498     {HAL_PIXEL_FORMAT_YCrCb_420_SP,               G2D_FMT_NV21,      1, 0},
499     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M,      G2D_FMT_NV21,      2, 0},
500     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_FULL, G2D_FMT_NV21,      2, 0},
501     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP,        G2D_FMT_NV12,      1, 0},
502     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M,      G2D_FMT_NV12,      2, 0},
503     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,       G2D_FMT_NV12,      1, 0},
504     {HAL_PIXEL_FORMAT_GOOGLE_NV12_SP,             G2D_FMT_NV12,      1, 0},
505     {HAL_PIXEL_FORMAT_YCBCR_P010,                 G2D_FMT_NV12_P010, 1, 0},
506     {HAL_PIXEL_FORMAT_GOOGLE_NV12_SP_10B,         G2D_FMT_NV12_P010, 1, 0},
507     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_P010_M,        G2D_FMT_NV12_P010, 2, 0},
508     {HAL_PIXEL_FORMAT_YCbCr_422_I,                G2D_FMT_YUYV,      1, 0},
509     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_422_I,         G2D_FMT_YVYU,      1, 0},
510     {HAL_PIXEL_FORMAT_YCbCr_422_SP,               G2D_FMT_NV16,      1, 0},
511     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC,     G2D_FMT_NV12_SBWC, 2, 0},
512     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC,      G2D_FMT_NV12_SBWC, 1, 0},
513     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC, G2D_FMT_NV12_SBWC_10B, 2, 0},
514     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC,  G2D_FMT_NV12_SBWC_10B, 1, 0},
515     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_SBWC,     G2D_FMT_NV21_SBWC, 2, 0},
516     {HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_10B_SBWC, G2D_FMT_NV21_SBWC_10B, 2, 0},
517     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L50, G2D_FMT_NV12_SBWC, 2, 0},
518     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L40, G2D_FMT_NV12_SBWC_10B, 2, 0},
519     {HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L80, G2D_FMT_NV12_SBWC_10B, 2, 0},
520 };
521 
halfmt_to_g2dfmt(struct g2d_fmt * tbl,size_t tbl_len,uint32_t halfmt)522 static g2d_fmt *halfmt_to_g2dfmt(struct g2d_fmt *tbl, size_t tbl_len, uint32_t halfmt)
523 {
524     for (size_t i = 0 ; i < tbl_len; i++) {
525         if (tbl[i].halfmt == halfmt)
526             return &tbl[i];
527     }
528 
529     ALOGE("Unable to find the proper G2D format for HAL format %#x", halfmt);
530 
531     return NULL;
532 }
533 
AcrylicCompositorG2D(const HW2DCapability & capability,bool newcolormode)534 AcrylicCompositorG2D::AcrylicCompositorG2D(const HW2DCapability &capability, bool newcolormode)
535     : Acrylic(capability), mDev((capability.maxLayerCount() > 2) ? "/dev/g2d" : "/dev/fimg2d"),
536       mMaxSourceCount(0), mPriority(-1)
537 {
538     memset(&mTask, 0, sizeof(mTask));
539 
540     mVersion = 0;
541     if (mDev.ioctl(G2D_IOC_VERSION, &mVersion) < 0)
542         ALOGERR("Failed to get G2D command version");
543     ALOGI("G2D API Version %d", mVersion);
544 
545     halfmt_to_g2dfmt_tbl = newcolormode ? __halfmt_to_g2dfmt : __halfmt_to_g2dfmt_legacy;
546     len_halfmt_to_g2dfmt_tbl = newcolormode ? ARRSIZE(__halfmt_to_g2dfmt) : ARRSIZE(__halfmt_to_g2dfmt_legacy);
547 
548     mUsePolyPhaseFilter = getCapabilities().supportedMinDecimation() == hw2d_coord_t{4, 4};
549 
550     ALOGD_TEST("Created a new Acrylic for G2D on %p", this);
551 }
552 
~AcrylicCompositorG2D()553 AcrylicCompositorG2D::~AcrylicCompositorG2D()
554 {
555     delete [] mTask.source;
556     delete [] mTask.commands.target;
557     for (unsigned int i = 0; i < mMaxSourceCount; i++)
558         delete [] mTask.commands.source[i];
559 
560     ALOGD_TEST("Deleting Acrylic for G2D on %p", this);
561 }
562 
updateFilterCoefficients(unsigned int layercount,g2d_reg regs[])563 unsigned int AcrylicCompositorG2D::updateFilterCoefficients(unsigned int layercount, g2d_reg regs[])
564 {
565     if (!mUsePolyPhaseFilter)
566         return 0;
567 
568     unsigned int cnt = 0;
569 
570     for (unsigned int i = 0; i < layercount; i++)
571         cnt += writeFilterCoefficients(mTask.commands.source[i][G2DSFR_SRC_XSCALE],
572                                        mTask.commands.source[i][G2DSFR_SRC_YSCALE],
573                                        mTask.commands.source[i][G2DSFR_IMG_COLORMODE],
574                                        i, regs + cnt);
575 
576     return cnt;
577 }
578 
579 #define SBWC_BLOCK_WIDTH 32
580 #define SBWC_BLOCK_HEIGHT 4
581 #define SBWC_BLOCK_SIZE(bit) (SBWC_BLOCK_WIDTH * SBWC_BLOCK_HEIGHT * (bit) / 8)
582 
583 #define SBWC_HEADER_ALIGN 16
584 #define SBWC_PAYLOAD_ALIGN 32
585 
586 #define SBWC_HEADER_STRIDE(w) \
587 	ALIGN(((w) / SBWC_BLOCK_WIDTH / 2), SBWC_HEADER_ALIGN)
588 #define SBWC_PAYLOAD_STRIDE(w, dep)\
589 	ALIGN(((w) / SBWC_BLOCK_WIDTH) * SBWC_BLOCK_SIZE(dep), \
590 	      SBWC_PAYLOAD_ALIGN)
591 
592 #define SBWC_LOSSY_PAYLOAD_STRIDE(w, block_byte) \
593 	ALIGN(((w) / SBWC_BLOCK_WIDTH) * (block_byte), \
594 	      SBWC_PAYLOAD_ALIGN)
595 
596 static uint32_t mfc_stride_formats[] = {
597     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN,
598     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC,
599     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC,
600     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC,
601     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC,
602     HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_SBWC,
603     HAL_PIXEL_FORMAT_EXYNOS_YCrCb_420_SP_M_10B_SBWC,
604 };
605 
606 static unsigned int sbwc_lossy_formats[] = {
607     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_SBWC_L50,
608     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L40,
609     HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SP_M_10B_SBWC_L80,
610 };
611 
prepareImage(AcrylicCanvas & layer,struct g2d_layer & image,uint32_t cmd[],int index)612 bool AcrylicCompositorG2D::prepareImage(AcrylicCanvas &layer, struct g2d_layer &image, uint32_t cmd[], int index)
613 {
614     image.flags = 0;
615 
616     if (layer.getFence() >= 0) {
617         image.flags |= G2D_LAYERFLAG_ACQUIRE_FENCE;
618         image.fence = layer.getFence();
619     }
620 
621     if (layer.isProtected())
622         image.flags |= G2D_LAYERFLAG_SECURE;
623 
624     g2d_fmt *g2dfmt = halfmt_to_g2dfmt(halfmt_to_g2dfmt_tbl, len_halfmt_to_g2dfmt_tbl, layer.getFormat());
625     if (!g2dfmt)
626         return false;
627 
628     image.flags &= ~G2D_LAYERFLAG_MFC_STRIDE;
629     for (size_t i = 0; i < ARRSIZE(mfc_stride_formats); i++) {
630         if (layer.getFormat() == mfc_stride_formats[i]) {
631             image.flags |= G2D_LAYERFLAG_MFC_STRIDE;
632             break;
633         }
634     }
635 
636     if (layer.getBufferType() == AcrylicCanvas::MT_EMPTY) {
637         image.buffer_type = G2D_BUFTYPE_EMPTY;
638     } else {
639         if (layer.getBufferCount() < g2dfmt->num_bufs) {
640             ALOGE("HAL Format %#x requires %d buffers but %d buffers are given",
641                     layer.getFormat(), g2dfmt->num_bufs, layer.getBufferCount());
642             return false;
643         }
644 
645         if (layer.getBufferType() == AcrylicCanvas::MT_DMABUF) {
646             image.buffer_type = G2D_BUFTYPE_DMABUF;
647             for (unsigned int i = 0; i < g2dfmt->num_bufs; i++) {
648                 image.buffer[i].dmabuf.fd = layer.getDmabuf(i);
649                 image.buffer[i].dmabuf.offset = layer.getOffset(i);
650                 image.buffer[i].length = layer.getBufferLength(i);
651             }
652         } else {
653             LOGASSERT(layer.getBufferType() == AcrylicCanvas::MT_USERPTR,
654                       "Unknown buffer type %d", layer.getBufferType());
655             image.buffer_type = G2D_BUFTYPE_USERPTR;
656             for (unsigned int i = 0; i < g2dfmt->num_bufs; i++) {
657                 image.buffer[i].userptr = layer.getUserptr(i);
658                 image.buffer[i].length = layer.getBufferLength(i);
659             }
660         }
661     }
662 
663     image.num_buffers = g2dfmt->num_bufs;
664 
665     hw2d_coord_t xy = layer.getImageDimension();
666 
667     cmd[G2DSFR_IMG_COLORMODE] = g2dfmt->g2dfmt;
668     if (layer.isUOrder())
669         cmd[G2DSFR_IMG_COLORMODE] |= G2D_DATAFORMAT_UORDER;
670 
671     if (layer.isCompressed()) {
672         // AFBC forces RGB swizzling order to BGR for RGB565
673         if (g2dfmt->g2dfmt == G2D_FMT_RGB565)
674             cmd[G2DSFR_IMG_COLORMODE] = G2D_FMT_BGR565;
675         cmd[G2DSFR_IMG_COLORMODE] |= G2D_DATAFORMAT_AFBC;
676         cmd[G2DSFR_IMG_STRIDE] = 0;
677     } else if (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC) {
678         cmd[G2DSFR_IMG_STRIDE] = 0;
679     } else {
680         cmd[G2DSFR_IMG_STRIDE] = g2dfmt->rgb_bpp * xy.hori;
681     }
682 
683     unsigned int payload = 0, header = 0, lossyByteNum = 0;
684 
685     if (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC) {
686         unsigned int blocksize;
687         unsigned int isLossy = 0;
688         unsigned int format = layer.getFormat();
689 
690         for (unsigned int i = 0; i < ARRSIZE(sbwc_lossy_formats); i++) {
691             if (format == sbwc_lossy_formats[i]) {
692                 isLossy = 1;
693                 blocksize = (i < 2) ? 64 : 128;
694                 break;
695             }
696         }
697 
698         if (isLossy) {
699             lossyByteNum = (blocksize >> 1) | isLossy;
700             payload = SBWC_LOSSY_PAYLOAD_STRIDE(xy.hori, blocksize);
701         } else {
702             payload = SBWC_PAYLOAD_STRIDE(xy.hori, (g2dfmt->g2dfmt & G2D_FMT_YCBCR_10BIT) ? 10 : 8);
703             header = SBWC_HEADER_STRIDE(xy.hori);
704         }
705     }
706 
707     if (index < 0) {
708         cmd[G2DSFR_DST_Y_HEADER_STRIDE] = header;
709         cmd[G2DSFR_DST_C_HEADER_STRIDE] = header;
710         cmd[G2DSFR_DST_Y_PAYLOAD_STRIDE] = payload;
711         cmd[G2DSFR_DST_C_PAYLOAD_STRIDE] = payload;
712         cmd[G2DSFR_DST_SBWCINFO] = lossyByteNum;
713     } else {
714         cmd[G2DSFR_SRC_Y_HEADER_STRIDE] = header;
715         cmd[G2DSFR_SRC_C_HEADER_STRIDE] = header;
716         cmd[G2DSFR_SRC_Y_PAYLOAD_STRIDE] = payload;
717         cmd[G2DSFR_SRC_C_PAYLOAD_STRIDE] = payload;
718         cmd[G2DSFR_SRC_SBWCINFO] = lossyByteNum;
719     }
720 
721     cmd[G2DSFR_IMG_LEFT]   = 0;
722     cmd[G2DSFR_IMG_TOP]    = 0;
723     cmd[G2DSFR_IMG_RIGHT]  = xy.hori;
724     cmd[G2DSFR_IMG_BOTTOM] = xy.vert;
725     cmd[G2DSFR_IMG_WIDTH]  = xy.hori;
726     cmd[G2DSFR_IMG_HEIGHT] = xy.vert;
727 
728     return true;
729 }
730 
setSolidLayer(struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t xy)731 static void setSolidLayer(struct g2d_layer &image, uint32_t cmd[], hw2d_coord_t xy)
732 {
733     image.flags = G2D_LAYERFLAG_COLORFILL;
734     image.buffer_type = G2D_BUFTYPE_EMPTY;
735     image.num_buffers = 0;
736 
737     cmd[G2DSFR_IMG_COLORMODE] = G2D_FMT_ARGB8888;
738     cmd[G2DSFR_IMG_STRIDE] = 4 * xy.hori;
739 
740     cmd[G2DSFR_IMG_WIDTH]  = xy.hori;
741     cmd[G2DSFR_IMG_HEIGHT] = xy.vert;
742 
743     cmd[G2DSFR_SRC_SELECT] = G2D_LAYERSEL_COLORFILL;
744     cmd[G2DSFR_SRC_COMMAND] = G2D_LAYERCMD_VALID;
745 
746     cmd[G2DSFR_SRC_ROTATE] = 0;
747     cmd[G2DSFR_SRC_SCALECONTROL] = 0;
748     cmd[G2DSFR_SRC_XSCALE] = G2D_SCALE_FACTOR(1, 1);
749     cmd[G2DSFR_SRC_YSCALE] = G2D_SCALE_FACTOR(1, 1);
750     cmd[G2DSFR_SRC_XPHASE] = 0;
751     cmd[G2DSFR_SRC_YPHASE] = 0;
752     cmd[G2DSFR_SRC_YCBCRMODE] = 0;
753     cmd[G2DSFR_SRC_HDRMODE] = 0;
754     cmd[G2DSFR_SRC_Y_HEADER_STRIDE] = 0;
755     cmd[G2DSFR_SRC_C_HEADER_STRIDE] = 0;
756     cmd[G2DSFR_SRC_Y_PAYLOAD_STRIDE] = 0;
757     cmd[G2DSFR_SRC_C_PAYLOAD_STRIDE] = 0;
758     cmd[G2DSFR_SRC_SBWCINFO] = 0;
759 }
760 
prepareSolidLayer(AcrylicCanvas & canvas,struct g2d_layer & image,uint32_t cmd[])761 bool AcrylicCompositorG2D::prepareSolidLayer(AcrylicCanvas &canvas, struct g2d_layer &image, uint32_t cmd[])
762 {
763     hw2d_coord_t xy = canvas.getImageDimension();
764 
765     setSolidLayer(image, cmd, xy);
766 
767     uint16_t a, r, g, b;
768     getBackgroundColor(&r, &g, &b, &a);
769 
770     cmd[G2DSFR_SRC_COLOR]  = (a & 0xFF00) << 16;
771     cmd[G2DSFR_SRC_COLOR] |= (r & 0xFF00) << 8;
772     cmd[G2DSFR_SRC_COLOR] |= (g & 0xFF00) << 0;
773     cmd[G2DSFR_SRC_COLOR] |= (b & 0xFF00) >> 8;
774 
775     cmd[G2DSFR_IMG_LEFT]   = 0;
776     cmd[G2DSFR_IMG_TOP]    = 0;
777     cmd[G2DSFR_IMG_RIGHT]  = xy.hori;
778     cmd[G2DSFR_IMG_BOTTOM] = xy.vert;
779 
780     cmd[G2DSFR_SRC_DSTLEFT]   = 0;
781     cmd[G2DSFR_SRC_DSTTOP]    = 0;
782     cmd[G2DSFR_SRC_DSTRIGHT]  = xy.hori;
783     cmd[G2DSFR_SRC_DSTBOTTOM] = xy.vert;
784 
785     cmd[G2DSFR_SRC_ALPHA] = 0;
786     cmd[G2DSFR_SRC_BLEND] = 0;
787 
788     return true;
789 }
790 
prepareSolidLayer(AcrylicLayer & layer,struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t target_size,unsigned int index)791 bool AcrylicCompositorG2D::prepareSolidLayer(AcrylicLayer &layer, struct g2d_layer &image, uint32_t cmd[], hw2d_coord_t target_size, unsigned int index)
792 {
793     hw2d_coord_t xy = layer.getImageDimension();
794 
795     setSolidLayer(image, cmd, xy);
796 
797     cmd[G2DSFR_SRC_COLOR]  = layer.getSolidColor();
798 
799     hw2d_rect_t crop = layer.getImageRect();
800     cmd[G2DSFR_IMG_LEFT]   = crop.pos.hori;
801     cmd[G2DSFR_IMG_TOP]    = crop.pos.vert;
802     cmd[G2DSFR_IMG_RIGHT]  = crop.size.hori + crop.pos.hori;
803     cmd[G2DSFR_IMG_BOTTOM] = crop.size.vert + crop.pos.vert;
804 
805     hw2d_rect_t window = layer.getTargetRect();
806     if (area_is_zero(window))
807         window.size = target_size;
808     cmd[G2DSFR_SRC_DSTLEFT]   = window.pos.hori;
809     cmd[G2DSFR_SRC_DSTTOP]    = window.pos.vert;
810     cmd[G2DSFR_SRC_DSTRIGHT]  = window.size.hori + window.pos.hori;
811     cmd[G2DSFR_SRC_DSTBOTTOM] = window.size.vert + window.pos.vert;
812 
813     uint8_t alpha = layer.getPlaneAlpha();
814     cmd[G2DSFR_SRC_ALPHA] = (alpha << 24) | (alpha << 16) | (alpha << 8) | alpha;
815     if ((layer.getCompositingMode() == HWC_BLENDING_PREMULT) ||
816             (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED)) {
817         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCOVER;
818     } else if ((layer.getCompositingMode() == HWC_BLENDING_COVERAGE) ||
819                (layer.getCompositingMode() == HWC2_BLEND_MODE_COVERAGE)) {
820         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_NONE;
821     } else {
822         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCCOPY;
823     }
824 
825     /* bottom layer always is opaque */
826     if (index == 0) {
827        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_OPAQUE;
828        if (alpha < 255)
829            cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_PREMULT_GLOBALALPHA;
830     } else {
831        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_ALPHABLEND;
832     }
833 
834     return true;
835 }
836 
prepareSource(AcrylicLayer & layer,struct g2d_layer & image,uint32_t cmd[],hw2d_coord_t target_size,unsigned int index,unsigned int image_index)837 bool AcrylicCompositorG2D::prepareSource(AcrylicLayer &layer, struct g2d_layer &image, uint32_t cmd[],
838                                              hw2d_coord_t target_size, unsigned int index, unsigned int image_index)
839 {
840     if (layer.isSolidColor()) {
841         prepareSolidLayer(layer, image, cmd, target_size, image_index);
842 
843         return true;
844     }
845 
846     if (!prepareImage(layer, image, cmd, index))
847         return false;
848 
849     cmd[G2DSFR_SRC_SELECT] = 0;
850 
851     hw2d_rect_t crop = layer.getImageRect();
852     cmd[G2DSFR_IMG_LEFT]   = crop.pos.hori;
853     cmd[G2DSFR_IMG_TOP]    = crop.pos.vert;
854     cmd[G2DSFR_IMG_RIGHT]  = crop.size.hori + crop.pos.hori;
855     cmd[G2DSFR_IMG_BOTTOM] = crop.size.vert + crop.pos.vert;
856 
857     hw2d_rect_t window = layer.getTargetRect();
858     if (area_is_zero(window))
859         window.size = target_size;
860     cmd[G2DSFR_SRC_DSTLEFT]   = window.pos.hori;
861     cmd[G2DSFR_SRC_DSTTOP]    = window.pos.vert;
862     cmd[G2DSFR_SRC_DSTRIGHT]  = window.size.hori + window.pos.hori;
863     cmd[G2DSFR_SRC_DSTBOTTOM] = window.size.vert + window.pos.vert;
864 
865     if (layer.isCompressed()) {
866         cmd[G2DSFR_IMG_WIDTH]--;
867         cmd[G2DSFR_IMG_HEIGHT]--;
868     }
869 
870     cmd[G2DSFR_SRC_ROTATE] = 0;
871     // HAL FLIP value: FLIP_H=0x01, FLIP_V=0x02
872     // G2D FLIP value: FLIP_Y=0x05, FLIP_X=0x04
873     unsigned int flip = layer.getTransform() & (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V);
874     if (!!(layer.getTransform() & HAL_TRANSFORM_ROT_90)) {
875         window.size.swap();
876 
877         cmd[G2DSFR_SRC_ROTATE] |= G2D_ROTATEDIR_ROT90CCW;
878         if (!flip || (flip == (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V)))
879             flip = ~flip & (HAL_TRANSFORM_FLIP_H | HAL_TRANSFORM_FLIP_V);
880     }
881 
882     cmd[G2DSFR_SRC_ROTATE] |= flip << G2D_ROTATEDIR_FLIP_SHIFT;
883 
884     cmd[G2DSFR_SRC_XSCALE] = G2D_SCALE_FACTOR(crop.size.hori, window.size.hori);
885     cmd[G2DSFR_SRC_YSCALE] = G2D_SCALE_FACTOR(crop.size.vert, window.size.vert);
886     // Configure interpolation only if it is required.
887     // Otherwise, G2D needs more bandwidth because it interpolates pixels
888     // even though it is not required.
889     if ((cmd[G2DSFR_SRC_XSCALE] | cmd[G2DSFR_SRC_YSCALE]) == G2D_SCALE_FACTOR(1, 1))
890         cmd[G2DSFR_SRC_SCALECONTROL] = 0;
891     else if (mUsePolyPhaseFilter)
892         cmd[G2DSFR_SRC_SCALECONTROL] = (index << G2D_SCALECONTROL_FILTERCOEF_SHIFT) | G2D_SCALECONTROL_POLYPHASE;
893     else
894         cmd[G2DSFR_SRC_SCALECONTROL] = G2D_SCALECONTROL_BILINEAR;
895 
896     // TODO: Configure initial phases according to the scale factors
897      cmd[G2DSFR_SRC_XPHASE] = 0;
898      cmd[G2DSFR_SRC_YPHASE] = 0;
899 
900     uint8_t alpha = layer.getPlaneAlpha();
901     cmd[G2DSFR_SRC_ALPHA] = (alpha << 24) | (alpha << 16) | (alpha << 8) | alpha;
902     if ((layer.getCompositingMode() == HWC_BLENDING_PREMULT) ||
903             (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED)) {
904         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCOVER;
905     } else if ((layer.getCompositingMode() == HWC_BLENDING_COVERAGE) ||
906                (layer.getCompositingMode() == HWC2_BLEND_MODE_COVERAGE)) {
907         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_NONE;
908     } else {
909         cmd[G2DSFR_SRC_BLEND] = G2D_BLEND_SRCCOPY;
910 
911         // HWC_BLEND_NONE is used not to appear its lower layer to target layer.
912         // But, when G2D output is reused by DPU, lower layer could appear to target layer.
913         // To prevent this, when blend mode is HWC_BLEND_NONE, make alpha channel max.
914         // Example case is as follow.
915         // If G2D composites several layers and topmost layer is HWC_BLEND_NONE
916         // and has alpha lower than max, that alpha value remains in target buffer.
917         // And if this result layer is recomposited with lower layer by DPU
918         // lower layer color appears to final result layer.
919         if ((cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ABGR8888) ||
920             (cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ARGB8888) ||
921             (cmd[G2DSFR_IMG_COLORMODE] == G2D_FMT_ABGR2101010)) {
922             cmd[G2DSFR_IMG_COLORMODE] &= ~G2D_SWZ_ALPHA_MASK;
923             cmd[G2DSFR_IMG_COLORMODE] |= G2D_SWZ_ALPHA_ONE;
924         }
925     }
926 
927     cmd[G2DSFR_SRC_COMMAND] = G2D_LAYERCMD_VALID;
928 
929     /* bottom layer always is opaque */
930     if (image_index == 0) {
931        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_OPAQUE;
932        if (alpha < 255)
933            cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_PREMULT_GLOBALALPHA;
934     } else {
935        cmd[G2DSFR_SRC_COMMAND] |= G2D_LAYERCMD_ALPHABLEND;
936     }
937 
938     cmd[G2DSFR_SRC_YCBCRMODE] = 0;
939     cmd[G2DSFR_SRC_HDRMODE] = 0;
940 
941     return true;
942 }
943 
reallocLayer(unsigned int layercount)944 bool AcrylicCompositorG2D::reallocLayer(unsigned int layercount)
945 {
946     if (mMaxSourceCount >= layercount)
947         return true;
948 
949     if (!mTask.commands.target) {
950         mTask.commands.target = new uint32_t[G2DSFR_DST_FIELD_COUNT];
951         if (!mTask.commands.target) {
952             ALOGE("Failed to allocate command buffer for target image");
953             return false;
954         }
955 
956 	memset(mTask.commands.target, 0, sizeof(uint32_t) * G2DSFR_DST_FIELD_COUNT);
957     }
958 
959     delete [] mTask.source;
960     for (unsigned int i = 0; i < mMaxSourceCount; i++)
961         delete [] mTask.commands.source[i];
962 
963     mMaxSourceCount = 0;
964 
965     mTask.source = new g2d_layer[layercount];
966     if (!mTask.source) {
967         ALOGE("Failed to allocate %u source image descriptors", layercount);
968         return false;
969     }
970 
971     for (unsigned int i = 0; i < layercount; i++) {
972         mTask.commands.source[i] = new uint32_t[G2DSFR_SRC_FIELD_COUNT];
973         if (mTask.commands.source[i] == NULL) {
974             ALOGE("Failed to allocate command buffer for source image");
975             while (i-- > 0)
976                 delete [] mTask.commands.source[i];
977 
978             delete [] mTask.source;
979             mTask.source = NULL;
980 
981             return false;
982         }
983 
984 	memset(mTask.commands.source[i], 0, sizeof(uint32_t) * G2DSFR_SRC_FIELD_COUNT);
985     }
986 
987     mMaxSourceCount = layercount;
988 
989     return true;
990 }
991 
ioctlG2D(void)992 int AcrylicCompositorG2D::ioctlG2D(void)
993 {
994     if (mVersion == 1) {
995         if (mDev.ioctl(G2D_IOC_PROCESS, &mTask) < 0)
996             return -errno;
997     } else {
998         struct g2d_compat_task task;
999 
1000         memcpy(&task, &mTask, sizeof(mTask) - sizeof(mTask.commands));
1001         memcpy(task.commands.target, mTask.commands.target, sizeof(task.commands.target));
1002 
1003         for (unsigned int i = 0; i < mMaxSourceCount; i++)
1004             task.commands.source[i] = mTask.commands.source[i];
1005 
1006         task.commands.extra = mTask.commands.extra;
1007         task.commands.num_extra_regs = mTask.commands.num_extra_regs;
1008 
1009         if (mDev.ioctl(G2D_IOC_COMPAT_PROCESS, &task) < 0)
1010             return -errno;
1011 
1012         mTask.flags = task.flags;
1013         mTask.laptime_in_usec = task.laptime_in_usec;
1014 
1015         for (unsigned int i = 0; i < mTask.num_release_fences; i++)
1016             mTask.release_fence[i] = task.release_fence[i];
1017     }
1018 
1019     return 0;
1020 }
1021 
executeG2D(int fence[],unsigned int num_fences,bool nonblocking)1022 bool AcrylicCompositorG2D::executeG2D(int fence[], unsigned int num_fences, bool nonblocking)
1023 {
1024     ATRACE_CALL();
1025     if (!validateAllLayers())
1026         return false;
1027 
1028     unsigned int layercount = layerCount();
1029 
1030     // Set invalid fence fd to the entries exceeds the number of source and destination images
1031     for (unsigned int i = layercount; i < num_fences; i++)
1032         fence[i] = -1;
1033 
1034     if (num_fences > layercount + 1)
1035         num_fences = layercount + 1;
1036 
1037     bool hasBackground = hasBackgroundColor();
1038 
1039     g2d_fmt *g2dfmt = halfmt_to_g2dfmt(halfmt_to_g2dfmt_tbl, len_halfmt_to_g2dfmt_tbl, getCanvas().getFormat());
1040     if (g2dfmt && (g2dfmt->g2dfmt & G2D_DATAFORMAT_SBWC))
1041         hasBackground = true;
1042 
1043     if (hasBackground) {
1044         layercount++;
1045 
1046         if (layercount > getCapabilities().maxLayerCount()) {
1047             ALOGE("Too many layers %d with the default background color configured", layerCount());
1048             return false;
1049         }
1050     }
1051 
1052     if (!reallocLayer(layercount))
1053         return false;
1054 
1055     sortLayers();
1056 
1057     mTask.flags = 0;
1058 
1059     if (!prepareImage(getCanvas(), mTask.target, mTask.commands.target, -1)) {
1060         ALOGE("Failed to configure the target image");
1061         return false;
1062     }
1063 
1064     if (getCanvas().isOTF())
1065         mTask.flags |= G2D_FLAG_HWFC;
1066 
1067     unsigned int baseidx = 0;
1068 
1069     if (hasBackground) {
1070         baseidx++;
1071         prepareSolidLayer(getCanvas(), mTask.source[0], mTask.commands.source[0]);
1072     }
1073 
1074     mTask.commands.target[G2DSFR_DST_YCBCRMODE] = 0;
1075 
1076     CSCMatrixWriter cscMatrixWriter(mTask.commands.target[G2DSFR_IMG_COLORMODE],
1077                                     getCanvas().getDataspace(),
1078                                     &mTask.commands.target[G2DSFR_DST_YCBCRMODE]);
1079 
1080     mTask.commands.target[G2DSFR_DST_YCBCRMODE] |= (G2D_LAYER_YCBCRMODE_OFFX | G2D_LAYER_YCBCRMODE_OFFY);
1081 
1082     for (unsigned int i = baseidx; i < layercount; i++) {
1083         AcrylicLayer &layer = *getLayer(i - baseidx);
1084 
1085         if (!prepareSource(layer, mTask.source[i],
1086                            mTask.commands.source[i], getCanvas().getImageDimension(),
1087                            i, i - baseidx)) {
1088             ALOGE("Failed to configure source layer %u", i - baseidx);
1089             return false;
1090         }
1091 
1092         if (!cscMatrixWriter.configure(mTask.commands.source[i][G2DSFR_IMG_COLORMODE],
1093                                        layer.getDataspace(),
1094                                        &mTask.commands.source[i][G2DSFR_SRC_YCBCRMODE])) {
1095             ALOGE("Failed to configure CSC coefficient of layer %d for dataspace %u",
1096                   i, layer.getDataspace());
1097             return false;
1098         }
1099 
1100         mHdrWriter.setLayerStaticMetadata(i, layer.getDataspace(),
1101                                           layer.getMinMasteringLuminance(),
1102                                           layer.getMaxMasteringLuminance());
1103 
1104         bool alpha_premult = (layer.getCompositingMode() == HWC_BLENDING_PREMULT)
1105                              || (layer.getCompositingMode() == HWC2_BLEND_MODE_PREMULTIPLIED);
1106         mHdrWriter.setLayerImageInfo(i, layer.getFormat(), alpha_premult);
1107         mHdrWriter.setLayerOpaqueData(i, layer.getLayerData(), layer.getLayerDataLength());
1108     }
1109 
1110     mHdrWriter.setTargetInfo(getCanvas().getDataspace(), getTargetDisplayInfo());
1111     mHdrWriter.setTargetDisplayLuminance(getMinTargetDisplayLuminance(), getMaxTargetDisplayLuminance());
1112 
1113     mHdrWriter.getCommands();
1114     mHdrWriter.getLayerHdrMode(mTask);
1115 
1116     mTask.num_source = layercount;
1117 
1118     if (nonblocking)
1119         mTask.flags |= G2D_FLAG_NONBLOCK;
1120 
1121     mTask.num_release_fences = num_fences;
1122     mTask.release_fence = reinterpret_cast<int *>(alloca(sizeof(int) * num_fences));
1123 
1124     mTask.commands.num_extra_regs = cscMatrixWriter.getRegisterCount() +
1125                                     mHdrWriter.getCommandCount();
1126     if (mUsePolyPhaseFilter)
1127         mTask.commands.num_extra_regs += getFilterCoefficientCount(mTask.commands.source, layercount);
1128 
1129     mTask.commands.extra = reinterpret_cast<g2d_reg *>(alloca(sizeof(g2d_reg) * mTask.commands.num_extra_regs));
1130 
1131     g2d_reg *regs = mTask.commands.extra;
1132 
1133     regs += cscMatrixWriter.write(regs);
1134 
1135     regs += updateFilterCoefficients(layercount, regs);
1136 
1137     mHdrWriter.write(regs);
1138 
1139     debug_show_g2d_task(mTask);
1140 
1141     if (ioctlG2D() < 0) {
1142         ALOGERR("Failed to process a task");
1143         show_g2d_task(mTask);
1144         return false;
1145     }
1146 
1147     mHdrWriter.putCommands();
1148 
1149     if (!!(mTask.flags & G2D_FLAG_ERROR)) {
1150         ALOGE("Error occurred during processing a task to G2D");
1151         show_g2d_task(mTask);
1152         return false;
1153     }
1154 
1155     getCanvas().clearSettingModified();
1156     getCanvas().setFence(-1);
1157 
1158     for (unsigned int i = 0; i < layerCount(); i++) {
1159         getLayer(i)->clearSettingModified();
1160         getLayer(i)->setFence(-1);
1161     }
1162 
1163     for (unsigned int i = 0; i < num_fences; i++)
1164         fence[i] = mTask.release_fence[i];
1165 
1166     return true;
1167 }
1168 
execute(int fence[],unsigned int num_fences)1169 bool AcrylicCompositorG2D::execute(int fence[], unsigned int num_fences)
1170 {
1171     if (!executeG2D(fence, num_fences, true)) {
1172         // Clearing all acquire fences because their buffers are expired.
1173         // The clients should configure everything again to start new execution
1174         for (unsigned int i = 0; i < layerCount(); i++)
1175             getLayer(i)->setFence(-1);
1176         getCanvas().setFence(-1);
1177 
1178         return false;
1179     }
1180 
1181     return true;
1182 }
1183 
execute(int * handle)1184 bool AcrylicCompositorG2D::execute(int *handle)
1185 {
1186     if (!executeG2D(NULL, 0, handle ? true : false)) {
1187         // Clearing all acquire fences because their buffers are expired.
1188         // The clients should configure everything again to start new execution
1189         for (unsigned int i = 0; i < layerCount(); i++)
1190             getLayer(i)->setFence(-1);
1191         getCanvas().setFence(-1);
1192 
1193         return false;
1194     }
1195 
1196     if (handle != NULL)
1197         *handle = 1; /* dummy handle */
1198 
1199     return true;
1200 }
1201 
waitExecution(int __unused handle)1202 bool AcrylicCompositorG2D::waitExecution(int __unused handle)
1203 {
1204     ALOGD_TEST("Waiting for execution of m2m1shot2 G2D completed by handle %d", handle);
1205 
1206     return true;
1207 }
1208 
requestPerformanceQoS(AcrylicPerformanceRequest * request)1209 bool AcrylicCompositorG2D::requestPerformanceQoS(AcrylicPerformanceRequest *request)
1210 {
1211     g2d_performance data;
1212 
1213     memset(&data, 0, sizeof(data));
1214 
1215     if (!request || (request->getFrameCount() == 0)) {
1216         if (mDev.ioctl(G2D_IOC_PERFORMANCE, &data) < 0) {
1217             ALOGERR("Failed to cancel performance request");
1218             return false;
1219         }
1220 
1221         ALOGD_TEST("Canceled performance request");
1222         return true;
1223     }
1224 
1225     ALOGD_TEST("Requesting performance: frame count %d:", request->getFrameCount());
1226     for (int i = 0; i < request->getFrameCount(); i++) {
1227         AcrylicPerformanceRequestFrame *frame = request->getFrame(i);
1228         uint64_t bandwidth = 0;
1229         bool src_yuv420_8b;
1230         bool src_rotate;
1231 
1232         src_rotate = false;
1233         src_yuv420_8b = false;
1234 
1235         unsigned int bpp;
1236         uint8_t planecount;
1237         uint32_t equiv_fmt;
1238         for (int idx = 0; idx < frame->getLayerCount(); idx++) {
1239             AcrylicPerformanceRequestLayer *layer = &(frame->mLayers[idx]);
1240             uint64_t layer_bw, pixelcount;
1241             int32_t is_scaling;
1242             uint32_t src_hori = layer->mSourceRect.size.hori;
1243             uint32_t src_vert = layer->mSourceRect.size.vert;
1244             uint32_t dst_hori = layer->mTargetRect.size.hori;
1245             uint32_t dst_vert = layer->mTargetRect.size.vert;
1246             data.frame[i].layer[idx].crop_width = src_hori;
1247             data.frame[i].layer[idx].crop_height = src_vert;
1248             data.frame[i].layer[idx].window_width = dst_hori;
1249             data.frame[i].layer[idx].window_height = dst_vert;
1250 
1251             // Src layer crop size is used when calculating read bandwidth.
1252             // Crop coordinates should be aligned in multiples of 16.
1253             pixelcount = (ALIGN(layer->mSourceRect.pos.hori + src_hori, 16) -
1254                           ALIGN_DOWN(layer->mSourceRect.pos.hori, 16)) *
1255                          (ALIGN(layer->mSourceRect.pos.vert + src_vert, 16) -
1256                           ALIGN_DOWN(layer->mSourceRect.pos.vert, 16));
1257 
1258             bpp = halfmt_bpp(layer->mPixFormat);
1259             planecount = halfmt_plane_count(layer->mPixFormat);
1260             equiv_fmt = find_format_equivalent(layer->mPixFormat);
1261 
1262             if (equiv_fmt == HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_SBWC ||
1263                 equiv_fmt == HAL_PIXEL_FORMAT_EXYNOS_YCbCr_420_SPN_10B_SBWC)
1264                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_SBWC;
1265             else if (layer->mAttribute & AcrylicCanvas::ATTR_COMPRESSED) {
1266                 if (planecount == 1)
1267                     data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_RGB_AFBC;
1268                 else
1269                     data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_YUV_AFBC;
1270             } else if (planecount == 2)
1271                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_YUV2P;
1272 
1273             // src_yuv420_8b is used when calculating write bandwidth
1274             if (bpp == 12) src_yuv420_8b = true;
1275 
1276             layer_bw = pixelcount * bpp;
1277             // Below is checking if scaling is involved.
1278             // Comparisons are replaced by additions to avoid branches.
1279             if (!!(layer->mTransform & HAL_TRANSFORM_ROT_90)) {
1280                 src_rotate = true;
1281                 data.frame[i].layer[idx].layer_attr |= G2D_PERF_LAYER_ROTATE;
1282 
1283                 is_scaling = src_hori - dst_vert;
1284                 is_scaling += src_vert - dst_hori;
1285             } else {
1286                 is_scaling = src_hori - dst_hori;
1287                 is_scaling += src_vert - dst_vert;
1288             }
1289             // Weight to the bandwidth when scaling is involved is 1.125.
1290             // It is multiplied by 16 to avoid multiplication with a real number.
1291             // We also get benefit from shift instead of multiplication.
1292             if (is_scaling == 0) {
1293                 layer_bw <<= 4; // layer_bw * 16
1294             } else {
1295                 layer_bw = (layer_bw << 4) + (layer_bw << 1); // layer_bw * 18
1296             }
1297 
1298             bandwidth += layer_bw;
1299             ALOGD_TEST("        LAYER[%d]: BW %llu FMT %#x(%u) (%dx%d)@(%dx%d)on(%dx%d) --> (%dx%d)@(%dx%d) TRFM %#x",
1300                     idx, static_cast<unsigned long long>(layer_bw), layer->mPixFormat, bpp,
1301                     layer->mSourceRect.size.hori, layer->mSourceRect.size.vert,
1302                     layer->mSourceRect.pos.hori, layer->mSourceRect.pos.vert,
1303                     layer->mSourceDimension.hori, layer->mSourceDimension.vert,
1304                     layer->mTargetRect.size.hori, layer->mTargetRect.size.vert,
1305                     layer->mTargetRect.pos.hori, layer->mTargetRect.pos.vert, layer->mTransform);
1306         }
1307 
1308         bandwidth *= frame->mFrameRate;
1309         bandwidth >>= 17; // divide by 16(weight), 8(bpp) and 1024(kilobyte)
1310 
1311         data.frame[i].bandwidth_read = static_cast<uint32_t>(bandwidth);
1312 
1313         bpp = halfmt_bpp(frame->mTargetPixFormat);
1314         bandwidth = frame->mTargetDimension.hori * frame->mTargetDimension.vert;
1315         bandwidth *= frame->mFrameRate * bpp;
1316 
1317         // When src rotation is involved, src format includes yuv420(8bit-depth)
1318         // and dst format is yuv420(8bit-depth), weight to the write bandwidth is 2.
1319         // RSH 12 : bw * 2 / (bits_per_byte * kilobyte)
1320         // RHS 13 : bw * 1 / (bits_per_byte * kilobyte)
1321         bandwidth >>= ((bpp == 12) && src_yuv420_8b && src_rotate) ? 12 : 13;
1322         data.frame[i].bandwidth_write = static_cast<uint32_t>(bandwidth);
1323 
1324         if (frame->mHasBackgroundLayer)
1325             data.frame[i].frame_attr |= G2D_PERF_FRAME_SOLIDCOLORFILL;
1326 
1327         data.frame[i].num_layers = frame->getLayerCount();
1328         data.frame[i].target_pixelcount = frame->mTargetDimension.vert * frame->mTargetDimension.hori;
1329         data.frame[i].frame_rate = frame->mFrameRate;
1330 
1331         ALOGD_TEST("    FRAME[%d]: BW:(%u, %u) Layercount %d, Framerate %d, Target %dx%d, FMT %#x Background? %d",
1332             i, data.frame[i].bandwidth_read, data.frame[i].bandwidth_write, data.frame[i].num_layers, frame->mFrameRate,
1333             frame->mTargetDimension.hori, frame->mTargetDimension.vert, frame->mTargetPixFormat,
1334             frame->mHasBackgroundLayer);
1335     }
1336 
1337     data.num_frame = request->getFrameCount();
1338 
1339     if (mDev.ioctl(G2D_IOC_PERFORMANCE, &data) < 0) {
1340         ALOGERR("Failed to request performance");
1341         return false;
1342     }
1343 
1344     return true;
1345 }
1346 
prioritize(int priority)1347 int AcrylicCompositorG2D::prioritize(int priority)
1348 {
1349     static int32_t g2d_priorities[] = {
1350             G2D_LOW_PRIORITY,     // 0
1351             G2D_MEDIUM_PRIORITY,  // 1
1352             G2D_HIGH_PRIORITY,    // 2
1353     };
1354 
1355     if (priority == mPriority)
1356         return 0;
1357 
1358     if (Acrylic::prioritize(priority) < 0)
1359         return -1;
1360 
1361     int32_t arg;
1362 
1363     if (priority > 2)
1364         arg = G2D_HIGHEST_PRIORITY;
1365     else if (priority < 0)
1366         arg = G2D_DEFAULT_PRIORITY;
1367     else
1368         arg = g2d_priorities[priority];
1369 
1370     if (mDev.ioctl(G2D_IOC_PRIORITY, &arg) < 0) {
1371         if (errno != EBUSY) {
1372             ALOGERR("Failed to set priority on a context of G2D");
1373             return -1;
1374         }
1375 
1376         ALOGD("G2D Driver returned EBUSY but the priority of %d(%d) is successfully applied", priority, arg);
1377         return 1;
1378     }
1379 
1380     ALOGD_TEST("Applied the priority of %d(%d) successfully", priority, arg);
1381 
1382     mPriority = priority;
1383 
1384     return 0;
1385 }
1386